{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 准备工作\n",
    "import base64\n",
    "import os\n",
    "import re\n",
    "import time\n",
    "from io import StringIO\n",
    "from random import random\n",
    "\n",
    "import numpy as np\n",
    "import pandas as pd\n",
    "import requests\n",
    "from lxml.html import fromstring\n",
    "from requests_html import HTMLSession\n",
    "from selenium.webdriver.common.by import By\n",
    "from PIL import Image"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-40-dd1f2cad3fb0>:10: DeprecationWarning: use options instead of chrome_options\n",
      "  driver = webdriver.Chrome( chrome_options = opts) #desired_capabilities=caps,\n"
     ]
    }
   ],
   "source": [
    "from selenium import webdriver\n",
    "from selenium.webdriver.common.desired_capabilities import DesiredCapabilities\n",
    "\n",
    "# Chrome launch flags for the scraping session.\n",
    "opts = webdriver.ChromeOptions()\n",
    "opts.add_argument('--no-sandbox')  # avoids the \"DevToolsActivePort file doesn't exist\" startup error\n",
    "opts.add_argument('--window-size=1920,3000')  # browser resolution; Chrome expects WIDTH,HEIGHT with a comma\n",
    "opts.add_argument('--disable-gpu')  # workaround mentioned in Google's docs to sidestep a bug\n",
    "opts.add_argument('--hide-scrollbars')  # hide scrollbars, which helps on some unusual pages\n",
    "\n",
    "# `chrome_options=` is deprecated in Selenium; `options=` is the supported keyword.\n",
    "driver = webdriver.Chrome(options=opts)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Open the CNKI home page.\n",
    "CNKI_HOME_URL = \"https://www.cnki.net/\"\n",
    "driver.get(CNKI_HOME_URL)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'中山大学南...'"
      ]
     },
     "execution_count": 46,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the inner HTML of the element with id 'Ecp_loginShowName1'\n",
    "# (presumably the logged-in account/institution name - confirm against the page).\n",
    "# `find_element_by_id` was removed in Selenium 4.3+; `find_element(By.ID, ...)` works on 3.x and 4.x.\n",
    "login_name_element = driver.find_element(By.ID, 'Ecp_loginShowName1')\n",
    "login_name_element.get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Open the advanced search page.\n",
    "driver.find_element(By.ID, 'highSearch').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'CDwindow-BE6D1D3D3A25740F8FBF0E2B1B7F55DE'"
      ]
     },
     "execution_count": 48,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Handle of the window the driver is currently attached to.\n",
    "current_handle = driver.current_window_handle\n",
    "current_handle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-BE6D1D3D3A25740F8FBF0E2B1B7F55DE',\n",
       " 'CDwindow-5B989C7D1660390CF02ED17FD9C16541']"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# List the handles of every window/tab the driver knows about.\n",
    "all_handles = driver.window_handles\n",
    "all_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-50-704fdf3805c1>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[1])\n"
     ]
    }
   ],
   "source": [
    "# Switch the driver to the second window handle.\n",
    "# `switch_to_window` is deprecated; `switch_to.window` is the supported API.\n",
    "driver.switch_to.window(driver.window_handles[1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Select the academic journals category.\n",
    "driver.find_element(By.XPATH, '//li[@data-id=\"xsqk\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Switch to professional search mode.\n",
    "driver.find_element(By.NAME, 'majorSearch').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Enter the search expression into the query textarea.\n",
    "# NOTE(review): the absolute XPath is tied to the current page layout; prefer a stable id/name if one exists.\n",
    "query_box = driver.find_element(By.XPATH, '/html/body/div[2]/div/div[2]/div/div[1]/div[1]/div[2]/textarea')\n",
    "query_box.clear()\n",
    "query_box.send_keys('SU = \"设计\" AND  (TI =\"人工智能\" OR  TI =\"大数据\"  OR TI = \"AI\" OR TI = \"big data\")')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 54,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Tick the CSSCI source filter.\n",
    "driver.find_element(By.XPATH, '//input[@key=\"CSI\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Tick the Peking University core journals source filter.\n",
    "driver.find_element(By.XPATH, '//input[@key=\"HX\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Run the search.\n",
    "driver.find_element(By.XPATH, '//input[@value=\"检索\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'1,370'"
      ]
     },
     "execution_count": 57,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the number of matching articles.\n",
    "driver.find_element(By.XPATH, '//*[@id=\"countPageDiv\"]/span[1]/em').get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 58,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Change the number of articles per page: open the per-page dropdown.\n",
    "per_page_toggle = driver.find_element(By.XPATH, '//*[@id=\"perPageDiv\"]/div/i')\n",
    "per_page_toggle.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 59,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Pick the third entry of the per-page list.\n",
    "per_page_option = driver.find_element(By.XPATH, '//*[@id=\"perPageDiv\"]/ul/li[3]/a')\n",
    "per_page_option.click()\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 60,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 获取详细页链接\n",
    "import re\n",
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>森林生态站大数据快速存储与索引方法  网络首发</td>\n",
       "      <td>王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福</td>\n",
       "      <td>农业机械学报</td>\n",
       "      <td>2021-07-06 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》</td>\n",
       "      <td>张诗雨</td>\n",
       "      <td>锻压技术</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>基于大数据分析的舰船装备寿命测试系统</td>\n",
       "      <td>化雪荟</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-06-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>基于大数据与信息技术的拖拉机零部件供应链</td>\n",
       "      <td>王弥</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>104.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>智能制造和大数据挖掘在农业机械设计中的应用</td>\n",
       "      <td>杜伯阳</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>基于特征加权的分布式大数据相关性挖掘方法</td>\n",
       "      <td>戴惠丽; 王敬宇</td>\n",
       "      <td>计算机仿真</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>基于AI的车载智能语音识别报警系统研制</td>\n",
       "      <td>苏明; 艾海明; 王东明</td>\n",
       "      <td>传感器与微系统</td>\n",
       "      <td>2021-06-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>165.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>人工智能教育的含义界定与原理挖掘</td>\n",
       "      <td>彭绍东</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-06-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>881.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>人工智能应用场景的界定与开发</td>\n",
       "      <td>李梦薇; 徐峰; 高芳</td>\n",
       "      <td>中国科技论坛</td>\n",
       "      <td>2021-06-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>123.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>滚刀状态实时诊断技术在超大直径泥水盾构中的应用——以汕头苏埃通道为例</td>\n",
       "      <td>魏晓龙; 林福龙; 孟祥波; 周树亮; 郭俊可</td>\n",
       "      <td>隧道建设(中英文)</td>\n",
       "      <td>2021-06-01 09:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>78.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>近5年图情SSCI期刊人工智能伦理研究文献分析与启示</td>\n",
       "      <td>黄崑; 徐晓婷; 黎安润泽; 徐峰</td>\n",
       "      <td>现代情报</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>671.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>教育信息化2.0背景下省级教育大数据平台建设研究  网络首发</td>\n",
       "      <td>汤岭球</td>\n",
       "      <td>当代教育论坛</td>\n",
       "      <td>2021-05-26 18:52</td>\n",
       "      <td>NaN</td>\n",
       "      <td>525.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>大数据挖掘技术的光流场图像匹配方法设计</td>\n",
       "      <td>黄凯宁; 郭有强; 杨静</td>\n",
       "      <td>激光杂志</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>36.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>大数据驱动的船舶航行路径跟踪研究</td>\n",
       "      <td>王冷</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-05-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>基于人工智能技术的船舶智能制造系统</td>\n",
       "      <td>聂华; 雷开元</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-05-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>大数据下基于机器学习的项目智能成本管理研究——以A风景园林规划研究院规划设计类项目为例</td>\n",
       "      <td>程平; 彭兰雅; 辜榕容</td>\n",
       "      <td>财会通讯</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>234.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>新时期中欧人工智能发展战略与政策环境的比较研究</td>\n",
       "      <td>关皓元; 高杰</td>\n",
       "      <td>管理现代化</td>\n",
       "      <td>2021-05-17 15:21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>342.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>大数据技术视域下智慧图书馆伦理危机与控制研究</td>\n",
       "      <td>陆康; 刘慧; 曹畋</td>\n",
       "      <td>高校图书馆工作</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>161.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>智能时代的中小学人工智能教育：总体定位与核心内容领域</td>\n",
       "      <td>卢宇; 汤筱玙; 宋佳宸; 余胜泉</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-05-12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1139.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>大数据环境下基于谱机器学习的云物流资源配置</td>\n",
       "      <td>张人龙; 刘小红</td>\n",
       "      <td>统计与决策</td>\n",
       "      <td>2021-05-10 10:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>269.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>酶工程：从人工设计到人工智能  网络首发</td>\n",
       "      <td>王雅丽;付友思;陈俊宏;黄佳城;廖浪星</td>\n",
       "      <td>化工学报</td>\n",
       "      <td>2021-05-08 14:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>228.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>论技术向善何以可能——人工智能教育伦理的逻辑起点</td>\n",
       "      <td>孙田琳子</td>\n",
       "      <td>高教探索</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>181.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>基于大数据的产品族本体造型意象挖掘方法研究  网络首发</td>\n",
       "      <td>王鹏; 朱韦龙</td>\n",
       "      <td>图学学报</td>\n",
       "      <td>2021-04-30 10:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>185.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>基于智能制造和大数据挖掘的农机数字化设计研究</td>\n",
       "      <td>任燕; 崔庚彦</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-04-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>238.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>语义分析及向量化大数据XSS入侵识别</td>\n",
       "      <td>张海军; 陈映辉</td>\n",
       "      <td>南开大学学报(自然科学版)</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>智能化学本评估初探——基于AI教师主讲课堂的试验研究</td>\n",
       "      <td>阮婷婷; 黄甫全; 曾文婕</td>\n",
       "      <td>教育研究与实验</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>96.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>大数据平台下化工企业消防安全风险分析指标设计</td>\n",
       "      <td>王滨滨;褚新颖;程诚;王禹寒;胡文倩</td>\n",
       "      <td>南开大学学报(自然科学版)</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>知识牵引与数据驱动的兵棋AI设计及关键技术  网络首发</td>\n",
       "      <td>程恺; 陈刚; 余晓晗; 刘满; 邵天浩</td>\n",
       "      <td>系统工程与电子技术</td>\n",
       "      <td>2021-04-19 08:31</td>\n",
       "      <td>NaN</td>\n",
       "      <td>140.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>基于网络舆情大数据的公共政策评价研究</td>\n",
       "      <td>邱尔丽; 张竞; 王雨舟; 曹攀</td>\n",
       "      <td>领导科学</td>\n",
       "      <td>2021-04-16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>216.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>基于Mapreduce的多源多模态大数据检索方法研究</td>\n",
       "      <td>魏秀卓; 赵慧南</td>\n",
       "      <td>计算机仿真</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>71.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>从学习效果和教育公平的角度看高等教育人工智能应用——一项基于多个数据库英文同行评审期刊文献的综述</td>\n",
       "      <td>郝丹; 肖俊洪</td>\n",
       "      <td>现代教育技术</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>250.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>“城市仿真”大数据平台简介</td>\n",
       "      <td>NaN</td>\n",
       "      <td>交通运输系统工程与信息</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>44.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>人工智能非主体性前提下侵权责任承担机制研究</td>\n",
       "      <td>付其运</td>\n",
       "      <td>法学杂志</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>250.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>机用碳纤维/ABS复合材料人工智能辅助成型工艺关键技术研究</td>\n",
       "      <td>黄罡</td>\n",
       "      <td>化工新型材料</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>47.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>城市轨道交通勘测大数据的集成与应用</td>\n",
       "      <td>任传斌; 于淼; 李珂; 冯增文</td>\n",
       "      <td>地质论评</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>39.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>人工智能驱动下智慧养老服务模式构建研究</td>\n",
       "      <td>赵奕钧; 邓大松</td>\n",
       "      <td>江淮论坛</td>\n",
       "      <td>2021-04-12 10:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>980.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>电子科技大学周军教授团队在芯片奥林匹克会议ISSCC发表人工智能芯片论文</td>\n",
       "      <td>NaN</td>\n",
       "      <td>信息网络安全</td>\n",
       "      <td>2021-04-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>51.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>面向重大公共事务决策风险治理的大数据行动框架</td>\n",
       "      <td>毕凌燕; 张海璇; 左文明</td>\n",
       "      <td>科技管理研究</td>\n",
       "      <td>2021-04-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>67.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>共智融合的大数据智能化人才培养研究与实践</td>\n",
       "      <td>冯永; 钟将; 王茜; 李学明</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-04-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>449.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>从教学样式到学习范式：人工智能环境下学习的通用设计转化</td>\n",
       "      <td>杨绪辉</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-04-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>336.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>人工智能教学中“知识建构、STEM、创客”三位一体教学模型的设计与应用</td>\n",
       "      <td>丁美荣; 王同聚</td>\n",
       "      <td>电化教育研究</td>\n",
       "      <td>2021-04-01</td>\n",
       "      <td>1.0</td>\n",
       "      <td>936.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>人工智能环境下广告创意人才的培养</td>\n",
       "      <td>赵朴</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-03-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>110.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>基于MapReduce的大数据在线聚集优化设计</td>\n",
       "      <td>李骏</td>\n",
       "      <td>河北大学学报(自然科学版)</td>\n",
       "      <td>2021-03-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>21.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>航空大数据研究综述</td>\n",
       "      <td>赵学武;吴宁;王军;阮利;李玲玲</td>\n",
       "      <td>计算机科学与探索</td>\n",
       "      <td>2021-03-23 16:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>412.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>人工智能技术的船舶航行轨迹控制算法</td>\n",
       "      <td>殷慧</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-03-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>大数据挖掘算法无人船信息管理系统</td>\n",
       "      <td>解莹</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-03-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>46.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>负责任的人工智能与设计创新</td>\n",
       "      <td>王韫; 徐迎庆</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>228.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>AI设计下的文本视觉问答技术</td>\n",
       "      <td>晋赞霞; 覃京燕; 殷绪成</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>54.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>AI设计下的智能驾驶场景文本识别技术</td>\n",
       "      <td>梁敏; 秦海波; 覃京燕; 殷绪成</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>143.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>唯物史观论域下人工智能的伦理问题思考与合伦理设计</td>\n",
       "      <td>田鹏颖; 周鑫</td>\n",
       "      <td>宁夏社会科学</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>355.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                                 篇名  \\\n",
       "0            1                            森林生态站大数据快速存储与索引方法  网络首发   \n",
       "1            2  人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》   \n",
       "2            3                                 基于大数据分析的舰船装备寿命测试系统   \n",
       "3            4                               基于大数据与信息技术的拖拉机零部件供应链   \n",
       "4            5                              智能制造和大数据挖掘在农业机械设计中的应用   \n",
       "5            6                               基于特征加权的分布式大数据相关性挖掘方法   \n",
       "6            7                                基于AI的车载智能语音识别报警系统研制   \n",
       "7            8                                   人工智能教育的含义界定与原理挖掘   \n",
       "8            9                                     人工智能应用场景的界定与开发   \n",
       "9           10                 滚刀状态实时诊断技术在超大直径泥水盾构中的应用——以汕头苏埃通道为例   \n",
       "10          11                         近5年图情SSCI期刊人工智能伦理研究文献分析与启示   \n",
       "11          12                     教育信息化2.0背景下省级教育大数据平台建设研究  网络首发   \n",
       "12          13                                大数据挖掘技术的光流场图像匹配方法设计   \n",
       "13          14                                   大数据驱动的船舶航行路径跟踪研究   \n",
       "14          15                                  基于人工智能技术的船舶智能制造系统   \n",
       "15          16        大数据下基于机器学习的项目智能成本管理研究——以A风景园林规划研究院规划设计类项目为例   \n",
       "16          17                            新时期中欧人工智能发展战略与政策环境的比较研究   \n",
       "17          18                             大数据技术视域下智慧图书馆伦理危机与控制研究   \n",
       "18          19                         智能时代的中小学人工智能教育：总体定位与核心内容领域   \n",
       "19          20                              大数据环境下基于谱机器学习的云物流资源配置   \n",
       "20          21                               酶工程：从人工设计到人工智能  网络首发   \n",
       "21          22                           论技术向善何以可能——人工智能教育伦理的逻辑起点   \n",
       "22          23                        基于大数据的产品族本体造型意象挖掘方法研究  网络首发   \n",
       "23          24                             基于智能制造和大数据挖掘的农机数字化设计研究   \n",
       "24          25                                 语义分析及向量化大数据XSS入侵识别   \n",
       "25          26                         智能化学本评估初探——基于AI教师主讲课堂的试验研究   \n",
       "26          27                             大数据平台下化工企业消防安全风险分析指标设计   \n",
       "27          28                        知识牵引与数据驱动的兵棋AI设计及关键技术  网络首发   \n",
       "28          29                                 基于网络舆情大数据的公共政策评价研究   \n",
       "29          30                         基于Mapreduce的多源多模态大数据检索方法研究   \n",
       "30          31   从学习效果和教育公平的角度看高等教育人工智能应用——一项基于多个数据库英文同行评审期刊文献的综述   \n",
       "31          32                                      “城市仿真”大数据平台简介   \n",
       "32          33                              人工智能非主体性前提下侵权责任承担机制研究   \n",
       "33          34                      机用碳纤维/ABS复合材料人工智能辅助成型工艺关键技术研究   \n",
       "34          35                                  城市轨道交通勘测大数据的集成与应用   \n",
       "35          36                                人工智能驱动下智慧养老服务模式构建研究   \n",
       "36          37               电子科技大学周军教授团队在芯片奥林匹克会议ISSCC发表人工智能芯片论文   \n",
       "37          38                             面向重大公共事务决策风险治理的大数据行动框架   \n",
       "38          39                               共智融合的大数据智能化人才培养研究与实践   \n",
       "39          40                        从教学样式到学习范式：人工智能环境下学习的通用设计转化   \n",
       "40          41                人工智能教学中“知识建构、STEM、创客”三位一体教学模型的设计与应用   \n",
       "41          42                                   人工智能环境下广告创意人才的培养   \n",
       "42          43                            基于MapReduce的大数据在线聚集优化设计   \n",
       "43          44                                          航空大数据研究综述   \n",
       "44          45                                  人工智能技术的船舶航行轨迹控制算法   \n",
       "45          46                                   大数据挖掘算法无人船信息管理系统   \n",
       "46          47                                      负责任的人工智能与设计创新   \n",
       "47          48                                     AI设计下的文本视觉问答技术   \n",
       "48          49                                 AI设计下的智能驾驶场景文本识别技术   \n",
       "49          50                           唯物史观论域下人工智能的伦理问题思考与合伦理设计   \n",
       "\n",
       "                         作者             刊名              发表时间   被引      下载  操作  \n",
       "0    王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福         农业机械学报  2021-07-06 09:48  NaN     NaN  下载  \n",
       "1                       张诗雨           锻压技术        2021-06-25  NaN     8.0  下载  \n",
       "2                       化雪荟         舰船科学技术        2021-06-23  NaN     NaN  下载  \n",
       "3                        王弥          农机化研究        2021-06-15  NaN   104.0  下载  \n",
       "4                       杜伯阳          农机化研究        2021-06-15  NaN   186.0  下载  \n",
       "5                  戴惠丽; 王敬宇          计算机仿真        2021-06-15  NaN     NaN  下载  \n",
       "6              苏明; 艾海明; 王东明        传感器与微系统        2021-06-10  NaN   165.0  下载  \n",
       "7                       彭绍东         中国电化教育        2021-06-08  NaN   881.0  下载  \n",
       "8               李梦薇; 徐峰; 高芳         中国科技论坛        2021-06-05  NaN   123.0  下载  \n",
       "9   魏晓龙; 林福龙; 孟祥波; 周树亮; 郭俊可      隧道建设(中英文)  2021-06-01 09:56  NaN    78.0  下载  \n",
       "10        黄崑; 徐晓婷; 黎安润泽; 徐峰           现代情报        2021-06-01  NaN   671.0  下载  \n",
       "11                      汤岭球         当代教育论坛  2021-05-26 18:52  NaN   525.0  下载  \n",
       "12             黄凯宁; 郭有强; 杨静           激光杂志        2021-05-25  NaN    36.0  下载  \n",
       "13                       王冷         舰船科学技术        2021-05-23  NaN     9.0  下载  \n",
       "14                  聂华; 雷开元         舰船科学技术        2021-05-23  NaN    64.0  下载  \n",
       "15             程平; 彭兰雅; 辜榕容           财会通讯        2021-05-20  NaN   234.0  下载  \n",
       "16                  关皓元; 高杰          管理现代化  2021-05-17 15:21  NaN   342.0  下载  \n",
       "17               陆康; 刘慧; 曹畋        高校图书馆工作        2021-05-15  NaN   161.0  下载  \n",
       "18        卢宇; 汤筱玙; 宋佳宸; 余胜泉         中国远程教育        2021-05-12  NaN  1139.0  下载  \n",
       "19                 张人龙; 刘小红          统计与决策  2021-05-10 10:39  NaN   269.0  下载  \n",
       "20      王雅丽;付友思;陈俊宏;黄佳城;廖浪星           化工学报  2021-05-08 14:42  NaN   228.0  下载  \n",
       "21                     孙田琳子           高教探索        2021-05-05  NaN   181.0  下载  \n",
       "22                  王鹏; 朱韦龙           图学学报  2021-04-30 10:50  NaN   185.0  下载  \n",
       "23                  任燕; 崔庚彦          农机化研究        2021-04-28  NaN   238.0  下载  \n",
       "24                 张海军; 陈映辉  南开大学学报(自然科学版)        2021-04-20  NaN    18.0  下载  \n",
       "25            阮婷婷; 黄甫全; 曾文婕        教育研究与实验        2021-04-20  NaN    96.0  下载  \n",
       "26       王滨滨;褚新颖;程诚;王禹寒;胡文倩  南开大学学报(自然科学版)        2021-04-20  NaN    53.0  下载  \n",
       "27     程恺; 陈刚; 余晓晗; 刘满; 邵天浩      系统工程与电子技术  2021-04-19 08:31  NaN   140.0  下载  \n",
       "28         邱尔丽; 张竞; 王雨舟; 曹攀           领导科学        2021-04-16  NaN   216.0  下载  \n",
       "29                 魏秀卓; 赵慧南          计算机仿真        2021-04-15  NaN    71.0  下载  \n",
       "30                  郝丹; 肖俊洪         现代教育技术        2021-04-15  NaN   250.0  下载  \n",
       "31                      NaN    交通运输系统工程与信息        2021-04-15  NaN    44.0  下载  \n",
       "32                      付其运           法学杂志        2021-04-15  NaN   250.0  下载  \n",
       "33                       黄罡         化工新型材料        2021-04-15  NaN    47.0  下载  \n",
       "34         任传斌; 于淼; 李珂; 冯增文           地质论评        2021-04-15  NaN    39.0  下载  \n",
       "35                 赵奕钧; 邓大松           江淮论坛  2021-04-12 10:39  NaN   980.0  下载  \n",
       "36                      NaN         信息网络安全        2021-04-10  NaN    51.0  下载  \n",
       "37            毕凌燕; 张海璇; 左文明         科技管理研究        2021-04-10  NaN    67.0  下载  \n",
       "38          冯永; 钟将; 王茜; 李学明         中国电化教育        2021-04-08  NaN   449.0  下载  \n",
       "39                      杨绪辉         中国电化教育        2021-04-08  NaN   336.0  下载  \n",
       "40                 丁美荣; 王同聚         电化教育研究        2021-04-01  1.0   936.0  下载  \n",
       "41                       赵朴           出版广角        2021-03-30  NaN   110.0  下载  \n",
       "42                       李骏  河北大学学报(自然科学版)        2021-03-25  NaN    21.0  下载  \n",
       "43         赵学武;吴宁;王军;阮利;李玲玲       计算机科学与探索  2021-03-23 16:56  NaN   412.0  下载  \n",
       "44                       殷慧         舰船科学技术        2021-03-23  NaN    60.0  下载  \n",
       "45                       解莹         舰船科学技术        2021-03-23  NaN    46.0  下载  \n",
       "46                  王韫; 徐迎庆           包装工程        2021-03-20  NaN   228.0  下载  \n",
       "47            晋赞霞; 覃京燕; 殷绪成           包装工程        2021-03-20  NaN    54.0  下载  \n",
       "48        梁敏; 秦海波; 覃京燕; 殷绪成           包装工程        2021-03-20  NaN   143.0  下载  \n",
       "49                  田鹏颖; 周鑫         宁夏社会科学        2021-03-20  NaN   355.0  下载  "
      ]
     },
     "execution_count": 61,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 抓取相关的重要信息\n",
    "element = driver.find_element_by_id('gridTable')\n",
    "page_html = element.get_attribute('innerHTML')\n",
    "页面数据 = pd.read_html(page_html)[0]\n",
    "页面数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {},
   "outputs": [],
   "source": [
    "html = driver.page_source\n",
    "root = fromstring(html)\n",
    "href = [x for x in root.xpath('.//*[@id=\"gridTable\"]/table/tbody/tr/td[2]/a/@href')]\n",
    "\n",
    "def correct(href):\n",
    "    DbCode = re.findall(\"DbCode=(.*?)&\",href)[0]\n",
    "    dbname = re.findall(\"dbname=(.*?)&\",href)[0]\n",
    "    filename = re.findall(\"filename=(.*?)&\",href)[0]\n",
    "    href = f\"https://kns.cnki.net/kcms/detail/detail.aspx?dbcode={DbCode}&dbname={dbname}&filename={filename}\"\n",
    "    return href"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 63,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>森林生态站大数据快速存储与索引方法  网络首发</td>\n",
       "      <td>王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福</td>\n",
       "      <td>农业机械学报</td>\n",
       "      <td>2021-07-06 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》</td>\n",
       "      <td>张诗雨</td>\n",
       "      <td>锻压技术</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>基于大数据分析的舰船装备寿命测试系统</td>\n",
       "      <td>化雪荟</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-06-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>基于大数据与信息技术的拖拉机零部件供应链</td>\n",
       "      <td>王弥</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>104.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>智能制造和大数据挖掘在农业机械设计中的应用</td>\n",
       "      <td>杜伯阳</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>基于特征加权的分布式大数据相关性挖掘方法</td>\n",
       "      <td>戴惠丽; 王敬宇</td>\n",
       "      <td>计算机仿真</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>基于AI的车载智能语音识别报警系统研制</td>\n",
       "      <td>苏明; 艾海明; 王东明</td>\n",
       "      <td>传感器与微系统</td>\n",
       "      <td>2021-06-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>165.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>人工智能教育的含义界定与原理挖掘</td>\n",
       "      <td>彭绍东</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-06-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>881.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>人工智能应用场景的界定与开发</td>\n",
       "      <td>李梦薇; 徐峰; 高芳</td>\n",
       "      <td>中国科技论坛</td>\n",
       "      <td>2021-06-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>123.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>滚刀状态实时诊断技术在超大直径泥水盾构中的应用——以汕头苏埃通道为例</td>\n",
       "      <td>魏晓龙; 林福龙; 孟祥波; 周树亮; 郭俊可</td>\n",
       "      <td>隧道建设(中英文)</td>\n",
       "      <td>2021-06-01 09:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>78.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>近5年图情SSCI期刊人工智能伦理研究文献分析与启示</td>\n",
       "      <td>黄崑; 徐晓婷; 黎安润泽; 徐峰</td>\n",
       "      <td>现代情报</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>671.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>教育信息化2.0背景下省级教育大数据平台建设研究  网络首发</td>\n",
       "      <td>汤岭球</td>\n",
       "      <td>当代教育论坛</td>\n",
       "      <td>2021-05-26 18:52</td>\n",
       "      <td>NaN</td>\n",
       "      <td>525.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>大数据挖掘技术的光流场图像匹配方法设计</td>\n",
       "      <td>黄凯宁; 郭有强; 杨静</td>\n",
       "      <td>激光杂志</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>36.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>大数据驱动的船舶航行路径跟踪研究</td>\n",
       "      <td>王冷</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-05-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>基于人工智能技术的船舶智能制造系统</td>\n",
       "      <td>聂华; 雷开元</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-05-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>大数据下基于机器学习的项目智能成本管理研究——以A风景园林规划研究院规划设计类项目为例</td>\n",
       "      <td>程平; 彭兰雅; 辜榕容</td>\n",
       "      <td>财会通讯</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>234.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>新时期中欧人工智能发展战略与政策环境的比较研究</td>\n",
       "      <td>关皓元; 高杰</td>\n",
       "      <td>管理现代化</td>\n",
       "      <td>2021-05-17 15:21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>342.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>大数据技术视域下智慧图书馆伦理危机与控制研究</td>\n",
       "      <td>陆康; 刘慧; 曹畋</td>\n",
       "      <td>高校图书馆工作</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>161.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>智能时代的中小学人工智能教育：总体定位与核心内容领域</td>\n",
       "      <td>卢宇; 汤筱玙; 宋佳宸; 余胜泉</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-05-12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1139.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>大数据环境下基于谱机器学习的云物流资源配置</td>\n",
       "      <td>张人龙; 刘小红</td>\n",
       "      <td>统计与决策</td>\n",
       "      <td>2021-05-10 10:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>269.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>酶工程：从人工设计到人工智能  网络首发</td>\n",
       "      <td>王雅丽;付友思;陈俊宏;黄佳城;廖浪星</td>\n",
       "      <td>化工学报</td>\n",
       "      <td>2021-05-08 14:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>228.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>论技术向善何以可能——人工智能教育伦理的逻辑起点</td>\n",
       "      <td>孙田琳子</td>\n",
       "      <td>高教探索</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>181.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>基于大数据的产品族本体造型意象挖掘方法研究  网络首发</td>\n",
       "      <td>王鹏; 朱韦龙</td>\n",
       "      <td>图学学报</td>\n",
       "      <td>2021-04-30 10:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>185.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>基于智能制造和大数据挖掘的农机数字化设计研究</td>\n",
       "      <td>任燕; 崔庚彦</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-04-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>238.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>语义分析及向量化大数据XSS入侵识别</td>\n",
       "      <td>张海军; 陈映辉</td>\n",
       "      <td>南开大学学报(自然科学版)</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>智能化学本评估初探——基于AI教师主讲课堂的试验研究</td>\n",
       "      <td>阮婷婷; 黄甫全; 曾文婕</td>\n",
       "      <td>教育研究与实验</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>96.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>大数据平台下化工企业消防安全风险分析指标设计</td>\n",
       "      <td>王滨滨;褚新颖;程诚;王禹寒;胡文倩</td>\n",
       "      <td>南开大学学报(自然科学版)</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>知识牵引与数据驱动的兵棋AI设计及关键技术  网络首发</td>\n",
       "      <td>程恺; 陈刚; 余晓晗; 刘满; 邵天浩</td>\n",
       "      <td>系统工程与电子技术</td>\n",
       "      <td>2021-04-19 08:31</td>\n",
       "      <td>NaN</td>\n",
       "      <td>140.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>基于网络舆情大数据的公共政策评价研究</td>\n",
       "      <td>邱尔丽; 张竞; 王雨舟; 曹攀</td>\n",
       "      <td>领导科学</td>\n",
       "      <td>2021-04-16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>216.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>基于Mapreduce的多源多模态大数据检索方法研究</td>\n",
       "      <td>魏秀卓; 赵慧南</td>\n",
       "      <td>计算机仿真</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>71.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>从学习效果和教育公平的角度看高等教育人工智能应用——一项基于多个数据库英文同行评审期刊文献的综述</td>\n",
       "      <td>郝丹; 肖俊洪</td>\n",
       "      <td>现代教育技术</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>250.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>“城市仿真”大数据平台简介</td>\n",
       "      <td>NaN</td>\n",
       "      <td>交通运输系统工程与信息</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>44.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>人工智能非主体性前提下侵权责任承担机制研究</td>\n",
       "      <td>付其运</td>\n",
       "      <td>法学杂志</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>250.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>机用碳纤维/ABS复合材料人工智能辅助成型工艺关键技术研究</td>\n",
       "      <td>黄罡</td>\n",
       "      <td>化工新型材料</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>47.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>城市轨道交通勘测大数据的集成与应用</td>\n",
       "      <td>任传斌; 于淼; 李珂; 冯增文</td>\n",
       "      <td>地质论评</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>39.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>人工智能驱动下智慧养老服务模式构建研究</td>\n",
       "      <td>赵奕钧; 邓大松</td>\n",
       "      <td>江淮论坛</td>\n",
       "      <td>2021-04-12 10:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>980.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>电子科技大学周军教授团队在芯片奥林匹克会议ISSCC发表人工智能芯片论文</td>\n",
       "      <td>NaN</td>\n",
       "      <td>信息网络安全</td>\n",
       "      <td>2021-04-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>51.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>面向重大公共事务决策风险治理的大数据行动框架</td>\n",
       "      <td>毕凌燕; 张海璇; 左文明</td>\n",
       "      <td>科技管理研究</td>\n",
       "      <td>2021-04-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>67.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>共智融合的大数据智能化人才培养研究与实践</td>\n",
       "      <td>冯永; 钟将; 王茜; 李学明</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-04-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>449.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>从教学样式到学习范式：人工智能环境下学习的通用设计转化</td>\n",
       "      <td>杨绪辉</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-04-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>336.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>人工智能教学中“知识建构、STEM、创客”三位一体教学模型的设计与应用</td>\n",
       "      <td>丁美荣; 王同聚</td>\n",
       "      <td>电化教育研究</td>\n",
       "      <td>2021-04-01</td>\n",
       "      <td>1.0</td>\n",
       "      <td>936.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>人工智能环境下广告创意人才的培养</td>\n",
       "      <td>赵朴</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-03-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>110.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>基于MapReduce的大数据在线聚集优化设计</td>\n",
       "      <td>李骏</td>\n",
       "      <td>河北大学学报(自然科学版)</td>\n",
       "      <td>2021-03-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>21.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>航空大数据研究综述</td>\n",
       "      <td>赵学武;吴宁;王军;阮利;李玲玲</td>\n",
       "      <td>计算机科学与探索</td>\n",
       "      <td>2021-03-23 16:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>412.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>人工智能技术的船舶航行轨迹控制算法</td>\n",
       "      <td>殷慧</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-03-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>大数据挖掘算法无人船信息管理系统</td>\n",
       "      <td>解莹</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-03-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>46.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>负责任的人工智能与设计创新</td>\n",
       "      <td>王韫; 徐迎庆</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>228.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>AI设计下的文本视觉问答技术</td>\n",
       "      <td>晋赞霞; 覃京燕; 殷绪成</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>54.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>AI设计下的智能驾驶场景文本识别技术</td>\n",
       "      <td>梁敏; 秦海波; 覃京燕; 殷绪成</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>143.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>唯物史观论域下人工智能的伦理问题思考与合伦理设计</td>\n",
       "      <td>田鹏颖; 周鑫</td>\n",
       "      <td>宁夏社会科学</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>355.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                                 篇名  \\\n",
       "0            1                            森林生态站大数据快速存储与索引方法  网络首发   \n",
       "1            2  人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》   \n",
       "2            3                                 基于大数据分析的舰船装备寿命测试系统   \n",
       "3            4                               基于大数据与信息技术的拖拉机零部件供应链   \n",
       "4            5                              智能制造和大数据挖掘在农业机械设计中的应用   \n",
       "5            6                               基于特征加权的分布式大数据相关性挖掘方法   \n",
       "6            7                                基于AI的车载智能语音识别报警系统研制   \n",
       "7            8                                   人工智能教育的含义界定与原理挖掘   \n",
       "8            9                                     人工智能应用场景的界定与开发   \n",
       "9           10                 滚刀状态实时诊断技术在超大直径泥水盾构中的应用——以汕头苏埃通道为例   \n",
       "10          11                         近5年图情SSCI期刊人工智能伦理研究文献分析与启示   \n",
       "11          12                     教育信息化2.0背景下省级教育大数据平台建设研究  网络首发   \n",
       "12          13                                大数据挖掘技术的光流场图像匹配方法设计   \n",
       "13          14                                   大数据驱动的船舶航行路径跟踪研究   \n",
       "14          15                                  基于人工智能技术的船舶智能制造系统   \n",
       "15          16        大数据下基于机器学习的项目智能成本管理研究——以A风景园林规划研究院规划设计类项目为例   \n",
       "16          17                            新时期中欧人工智能发展战略与政策环境的比较研究   \n",
       "17          18                             大数据技术视域下智慧图书馆伦理危机与控制研究   \n",
       "18          19                         智能时代的中小学人工智能教育：总体定位与核心内容领域   \n",
       "19          20                              大数据环境下基于谱机器学习的云物流资源配置   \n",
       "20          21                               酶工程：从人工设计到人工智能  网络首发   \n",
       "21          22                           论技术向善何以可能——人工智能教育伦理的逻辑起点   \n",
       "22          23                        基于大数据的产品族本体造型意象挖掘方法研究  网络首发   \n",
       "23          24                             基于智能制造和大数据挖掘的农机数字化设计研究   \n",
       "24          25                                 语义分析及向量化大数据XSS入侵识别   \n",
       "25          26                         智能化学本评估初探——基于AI教师主讲课堂的试验研究   \n",
       "26          27                             大数据平台下化工企业消防安全风险分析指标设计   \n",
       "27          28                        知识牵引与数据驱动的兵棋AI设计及关键技术  网络首发   \n",
       "28          29                                 基于网络舆情大数据的公共政策评价研究   \n",
       "29          30                         基于Mapreduce的多源多模态大数据检索方法研究   \n",
       "30          31   从学习效果和教育公平的角度看高等教育人工智能应用——一项基于多个数据库英文同行评审期刊文献的综述   \n",
       "31          32                                      “城市仿真”大数据平台简介   \n",
       "32          33                              人工智能非主体性前提下侵权责任承担机制研究   \n",
       "33          34                      机用碳纤维/ABS复合材料人工智能辅助成型工艺关键技术研究   \n",
       "34          35                                  城市轨道交通勘测大数据的集成与应用   \n",
       "35          36                                人工智能驱动下智慧养老服务模式构建研究   \n",
       "36          37               电子科技大学周军教授团队在芯片奥林匹克会议ISSCC发表人工智能芯片论文   \n",
       "37          38                             面向重大公共事务决策风险治理的大数据行动框架   \n",
       "38          39                               共智融合的大数据智能化人才培养研究与实践   \n",
       "39          40                        从教学样式到学习范式：人工智能环境下学习的通用设计转化   \n",
       "40          41                人工智能教学中“知识建构、STEM、创客”三位一体教学模型的设计与应用   \n",
       "41          42                                   人工智能环境下广告创意人才的培养   \n",
       "42          43                            基于MapReduce的大数据在线聚集优化设计   \n",
       "43          44                                          航空大数据研究综述   \n",
       "44          45                                  人工智能技术的船舶航行轨迹控制算法   \n",
       "45          46                                   大数据挖掘算法无人船信息管理系统   \n",
       "46          47                                      负责任的人工智能与设计创新   \n",
       "47          48                                     AI设计下的文本视觉问答技术   \n",
       "48          49                                 AI设计下的智能驾驶场景文本识别技术   \n",
       "49          50                           唯物史观论域下人工智能的伦理问题思考与合伦理设计   \n",
       "\n",
       "                         作者             刊名              发表时间   被引      下载  操作  \\\n",
       "0    王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福         农业机械学报  2021-07-06 09:48  NaN     NaN  下载   \n",
       "1                       张诗雨           锻压技术        2021-06-25  NaN     8.0  下载   \n",
       "2                       化雪荟         舰船科学技术        2021-06-23  NaN     NaN  下载   \n",
       "3                        王弥          农机化研究        2021-06-15  NaN   104.0  下载   \n",
       "4                       杜伯阳          农机化研究        2021-06-15  NaN   186.0  下载   \n",
       "5                  戴惠丽; 王敬宇          计算机仿真        2021-06-15  NaN     NaN  下载   \n",
       "6              苏明; 艾海明; 王东明        传感器与微系统        2021-06-10  NaN   165.0  下载   \n",
       "7                       彭绍东         中国电化教育        2021-06-08  NaN   881.0  下载   \n",
       "8               李梦薇; 徐峰; 高芳         中国科技论坛        2021-06-05  NaN   123.0  下载   \n",
       "9   魏晓龙; 林福龙; 孟祥波; 周树亮; 郭俊可      隧道建设(中英文)  2021-06-01 09:56  NaN    78.0  下载   \n",
       "10        黄崑; 徐晓婷; 黎安润泽; 徐峰           现代情报        2021-06-01  NaN   671.0  下载   \n",
       "11                      汤岭球         当代教育论坛  2021-05-26 18:52  NaN   525.0  下载   \n",
       "12             黄凯宁; 郭有强; 杨静           激光杂志        2021-05-25  NaN    36.0  下载   \n",
       "13                       王冷         舰船科学技术        2021-05-23  NaN     9.0  下载   \n",
       "14                  聂华; 雷开元         舰船科学技术        2021-05-23  NaN    64.0  下载   \n",
       "15             程平; 彭兰雅; 辜榕容           财会通讯        2021-05-20  NaN   234.0  下载   \n",
       "16                  关皓元; 高杰          管理现代化  2021-05-17 15:21  NaN   342.0  下载   \n",
       "17               陆康; 刘慧; 曹畋        高校图书馆工作        2021-05-15  NaN   161.0  下载   \n",
       "18        卢宇; 汤筱玙; 宋佳宸; 余胜泉         中国远程教育        2021-05-12  NaN  1139.0  下载   \n",
       "19                 张人龙; 刘小红          统计与决策  2021-05-10 10:39  NaN   269.0  下载   \n",
       "20      王雅丽;付友思;陈俊宏;黄佳城;廖浪星           化工学报  2021-05-08 14:42  NaN   228.0  下载   \n",
       "21                     孙田琳子           高教探索        2021-05-05  NaN   181.0  下载   \n",
       "22                  王鹏; 朱韦龙           图学学报  2021-04-30 10:50  NaN   185.0  下载   \n",
       "23                  任燕; 崔庚彦          农机化研究        2021-04-28  NaN   238.0  下载   \n",
       "24                 张海军; 陈映辉  南开大学学报(自然科学版)        2021-04-20  NaN    18.0  下载   \n",
       "25            阮婷婷; 黄甫全; 曾文婕        教育研究与实验        2021-04-20  NaN    96.0  下载   \n",
       "26       王滨滨;褚新颖;程诚;王禹寒;胡文倩  南开大学学报(自然科学版)        2021-04-20  NaN    53.0  下载   \n",
       "27     程恺; 陈刚; 余晓晗; 刘满; 邵天浩      系统工程与电子技术  2021-04-19 08:31  NaN   140.0  下载   \n",
       "28         邱尔丽; 张竞; 王雨舟; 曹攀           领导科学        2021-04-16  NaN   216.0  下载   \n",
       "29                 魏秀卓; 赵慧南          计算机仿真        2021-04-15  NaN    71.0  下载   \n",
       "30                  郝丹; 肖俊洪         现代教育技术        2021-04-15  NaN   250.0  下载   \n",
       "31                      NaN    交通运输系统工程与信息        2021-04-15  NaN    44.0  下载   \n",
       "32                      付其运           法学杂志        2021-04-15  NaN   250.0  下载   \n",
       "33                       黄罡         化工新型材料        2021-04-15  NaN    47.0  下载   \n",
       "34         任传斌; 于淼; 李珂; 冯增文           地质论评        2021-04-15  NaN    39.0  下载   \n",
       "35                 赵奕钧; 邓大松           江淮论坛  2021-04-12 10:39  NaN   980.0  下载   \n",
       "36                      NaN         信息网络安全        2021-04-10  NaN    51.0  下载   \n",
       "37            毕凌燕; 张海璇; 左文明         科技管理研究        2021-04-10  NaN    67.0  下载   \n",
       "38          冯永; 钟将; 王茜; 李学明         中国电化教育        2021-04-08  NaN   449.0  下载   \n",
       "39                      杨绪辉         中国电化教育        2021-04-08  NaN   336.0  下载   \n",
       "40                 丁美荣; 王同聚         电化教育研究        2021-04-01  1.0   936.0  下载   \n",
       "41                       赵朴           出版广角        2021-03-30  NaN   110.0  下载   \n",
       "42                       李骏  河北大学学报(自然科学版)        2021-03-25  NaN    21.0  下载   \n",
       "43         赵学武;吴宁;王军;阮利;李玲玲       计算机科学与探索  2021-03-23 16:56  NaN   412.0  下载   \n",
       "44                       殷慧         舰船科学技术        2021-03-23  NaN    60.0  下载   \n",
       "45                       解莹         舰船科学技术        2021-03-23  NaN    46.0  下载   \n",
       "46                  王韫; 徐迎庆           包装工程        2021-03-20  NaN   228.0  下载   \n",
       "47            晋赞霞; 覃京燕; 殷绪成           包装工程        2021-03-20  NaN    54.0  下载   \n",
       "48        梁敏; 秦海波; 覃京燕; 殷绪成           包装工程        2021-03-20  NaN   143.0  下载   \n",
       "49                  田鹏颖; 周鑫         宁夏社会科学        2021-03-20  NaN   355.0  下载   \n",
       "\n",
       "                                                详细页链接  \n",
       "0   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "1   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "2   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "3   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "4   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "5   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "6   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "7   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "8   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "9   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "10  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "11  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "12  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "13  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "14  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "15  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "16  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "17  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "18  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "19  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "20  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "21  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "22  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "23  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "24  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "25  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "26  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "27  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "28  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "29  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "30  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "31  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "32  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "33  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "34  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "35  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "36  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "37  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "38  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "39  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "40  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "41  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "42  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "43  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "44  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "45  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "46  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "47  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "48  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "49  https://kns.cnki.net/kcms/detail/detail.aspx?d...  "
      ]
     },
     "execution_count": 63,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Pass every scraped href through correct() (defined earlier in the notebook)\n",
    "# to obtain the detail-page links, keeping the original order.\n",
    "links=[correct(raw_link) for raw_link in href]\n",
    "\n",
    "# Build the combined table once, after all links are known: the result page is\n",
    "# parsed a single time, and the frame is defined even when href is empty.\n",
    "df_links=pd.DataFrame({'详细页链接':links})\n",
    "df_页面表格=pd.concat([pd.read_html(page_html)[0],df_links],axis=1)\n",
    "\n",
    "df_页面表格"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 64,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Collect the PDF download link from every article detail page\n",
    "from requests_html import HTMLSession\n",
    "import urllib.parse\n",
    "pdf_links=[]\n",
    "# Use a single session for the whole crawl and close it when done; creating a\n",
    "# fresh HTMLSession per URL leaves one unclosed connection pool per request.\n",
    "with HTMLSession() as session:\n",
    "    for url in links:\n",
    "        r = session.get(url)\n",
    "        # Keep the second href matched for the pdfDown id (index 1).\n",
    "        # NOTE(review): raises IndexError if a page has fewer than two matches.\n",
    "        pdf_link_xpath=r.html.xpath('//*[@id=\"pdfDown\"]/@href')[1]\n",
    "        pdf_links.append(pdf_link_xpath)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 65,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['/kcms/download.aspx?filename=phHWmV3RDFWROh2TI12LUZ0cylmU3FGayJzLrVHNRJkaa12VtZUVyQ0S3hDVGRjZEV0V1RVZlNWUMxUeFhXWpdDaKZTVoF3NW1URvcXdmFFZp52VWZmcydTTh9EUOhGasBTbycTNmN3TqdVZHVjS4B1YuF2YU9EU&tablename=CAPJDAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=HWmV3RDFWROh2TI12LUZ0cylmU3FGayJzLrVHNRJkaa12VtZUVyQ0S3hDVGRjZEV0V1RVZlNWUMxUe=0TWzQjRItGcxNjb1MXenVkaRV0QlZ2V3xWUDxET3FETHt0SoNESiN3TqdVZHVjS4B1YuF2YU9EUph&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=DTUdnVvdVZ4EEN5FzbWZjaJR2YX90KMtUMGtme4VkQQFldLlzbzwkUFZWO5ZnYCpmTFVEWG5mdmZnQ=0TSzw2SvkFMWRUSSBDc4xWbn9EO2sCeBRFWqVFWzMTOy1WeBR2LQd1MQJFaywURxJ3NXVHMxcDcHV&tablename=CJFDAUTODAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=DTUdnVvdVZ4EEN5FzbWZjaJR2YX90KMtUMGtme4VkQQFldLlzbzwkUFZWO5ZnYCpmTFVEWG5mdmZnQ=0TUDJTUUVVd0NHZQdHUkBjSP5kSvNEe2cDWqVFWzMTOy1WeBR2LQd1MQJFaywURxJ3NXVHMxcDcHV&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=GZJdnaz1GdNd0QixGU3gGMxF1b0JjUMVFWMNkMPJEbSRDbLVjMaZ1NlpHelZHeGp1YjBHUnZUYIllR=0zbMZ0TF9SRpdmd3U3MuFHbmpVaCFzVWJFRzFXazYWRnBVMKJHOLNmRWRzK0wmYwR3MrwUbXdUYDh&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=2bnVFV5wENUN1dLFmM3V2ToFGS4tyNupER6lWchV0ZBljMzJXV0N2bKhFTWpmW1MEbVpVSHl1TilUS=0DMTpEe0lGU0EXWT9We5VHTvclUsJVOJZDaiN1RjlkWKl1RJFUSRpVN4JUU5Z1QwRnNzYlRP9UbQJ&tablename=CJFDAUTODAY&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=QJ2bnVFV5wENUN1dLFmM3V2ToFGS4tyNupER6lWchV0ZBljMzJXV0N2bKhFTWpmW1MEbVpVSHl1TilUSK1WQnpXc0NzRYNVUxBHcxIDVsJjYtB1YNV2N1BTciFnUFdmbzUjbxJmeSpVN4JUU5Z1QwRnNzYlRP9Ub&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=rQFeIREVhhVZvljMzoWS2pVeMdkcp9yYpd2KltiNI1kS4JHahZEetdVaMt0RHp2Q39ybLtkQolGdERHTjFXVVBFNXZkMJZ2N18UZsVGVQdFbiVEN2hma1AHNulmUwo3U3dnYiNlYBF2Z5p0TFh1YllVNOpHWtFmU&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=5gERrVjaPJkapFDMNVzQBR2cwgnNKh3KRBFUlV0YxsGaE1mUlpGVPF3SkV1M2VzaoRlS5cGbqRVRzZ0UycFOjNXOmpXeIZDTUpXSHJkah9UVqN3VQ1EWChlY6h2ZwUHUGVmT28kapJUaplUY3omVIR1bpFEZxQ3L&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=uBFWnR2VRVGNWNzV2UXRHdXdwJHNX12YnVkSYd1NGlTe6NVNrlTcVFTcO1UcI9CVsBVeOFFZKVmcVFnVlNWQPZ0aBN0bBt0bOFTUYhTbYRHcMBTbJRzcuhjYo9iYilkVyo2LvBHZ3cHZGZmYT9GOZNHalZGOMNVY&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=uBFWnR2VRVGNWNzV2UXRHdXdwJHNX12YnVkSYd1NGlTe6NVNrlTcVFTcO1UcI9CVsBVeOFFZKVmcVFnVpF1RzRjTup1S5VURadkQkd0KaVETEFXStplZykWMtllZwUkTth0K5hHd0cHZGZmYT9GOZNHalZGOMNVY&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=t9mcOdUQ5AXMv4WVshzRFN3VrJFN69UdwgkbkNEOzl2MSNWM4YEUy9ER39iV2Z1LJZ2Q4J0Vjh3VvNVWI5WYkhnWDVnWIV1LvtiNldzSNRXd3RTbHhUQwEXNPF2TWllYslGS3J0Y2pkSr1kcVlFM0ZWaSBDczQTd&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=t9mcOdUQ5AXMv4WVshzRFN3VrJFN69UdwgkbkNEOzl2MSNWM4YEUy9ER39iV2Z1LJZ2Q4J0Vjh3VvNVWTplTWNXWpRWduZjYxskNB9UM4IkbJhXc25kcykVNKZlaCpnTiVkeIpnU1pkSr1kcVlFM0ZWaSBDczQTd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=TMNtkeTVlW4MnMFNUevtyTxYjRNRXMT1kVW9ENqh1SFZnWHtCRmJ0TtdVOjRmYKJVMXJ0amxkeoJEb=0TREZjQyQzTkdGSlhEe5E2NiRzTyUUYihEOYlUbPt0M2V1U2ZFV0FlWHFUcJh2Z1EHWJdVRFNzLlV&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=GSvl2b3lDaalVYIJ2LDNHdKt0dKhGbOxGbx5GV1smawVlSHZnN1UVV2F0UmJ2bxdXUhx2YHVmZKtGc=0TUK12Z5pFcRVTSRRWQzBTRrgHSuZlSqhXROplaYdVb3h0cRN1VCF0L2ZlbrkjU3kEdMZXcKZmcTR&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=t1kYvNDNPRDOL9icJRGM3kHd0Y1Z0sSePhkMzEUN4knehVXTPp0NOlDT3Zzc4B3Ky42b0YVVn92SkZ1cwIlc4UDRptUdM5Ge5oXNFhFehdVc01Wbzc3UrBFSPd0Nx0UVzBzRrMXZ1YVZjdjayYjcTRzU4ETaJxWY&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=5gEbzMWbrBjTshmUwVHMMFzVY90QBh3LltyKrYEbTFTZ5gUV5UFdvUWR6ZGbPZkV6VGM5ckTIhEeGhndudkS5IkYZ5kMrJkNWV3a3FXbt92TXpFc18ybQdFbxdGc3RHbwZ3YsNHWzc1cspVViF0UNdlQxNkQ0Q2M&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=wsCWmVHbvoVRLd1KyQmdQVXc0RVM4onR2gDR002Src3MiNWMwZTel1ETyFWc2l2cRNjazJnRppFZhhWeKlEMBVEVYp3TWtEbz0mepF3VolFUQd1brEjNwkEV5kVb0F3YRtmawAlbChmRK9SUEFlM3hkRJZ3Q0ZTZ&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=2RzK0AVShJWbzlENwgnMlZUdqRWc34kTHBzY3h3ZCZ2L6lzLwhUY1Rjet9yR4l0dpBnT41UciNkdXVnRoZ1MwRWW3AFMkJmaxtEcEp3VnNnMJN1MFdFRnNUZo1URGNTZ5oVcGJ0bspFZspWRvIUQ4dWWtdnS2V3V&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=2RzK0AVShJWbzlENwgnMlZUdqRWc34kTHBzY3h3ZCZ2L6lzLwhUY1Rjet9yR4l0dpBnT41UciNkdXVnRzYHeP9ESrlkTktGZx4Uc3gDe6dldCJkU1tEOXtWUGl2KsFUcrADMZFTYrpFZspWRvIUQ4dWWtdnS2V3V&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=uNjUURHNrZGb0N0T4clY0VVVPt0KXhTcFN2Ny1EbyYFUOBzZwYXeoxWc2MWUZJTdxVUeGhnaDZlYxZWS2QjYhlkRrQFcKtWYiBTUYRmY1VTU2kDc2JHdJ52LKB3YnlXRSJXRLl3MxljT0V3YYNjTo9SZ5Z2SnF3S&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=jUURHNrZGb0N0T4clY0VVVPt0KXhTcFN2Ny1EbyYFUOBzZwYXeoxWc2MWUZJTdxVUeGhnaDZlYxZWS=0TTwhUZvFGUyd3Ss5kYOtEWzsWQxYGS0U0ZqV3MONjTyFVN2sWVxljT0V3YYNjTo9SZ5Z2SnF3SuN&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=kRHM04UaXVnQapVUvJjcxgWO1Z1YORDavJ3KNNWMmdEVJhVcwJld3kDWMFEbNplQud3dFlmYkd2RTBFTaRDROh2MsB1aLBjNQdVbwkza3oUS69UMZh2NCpFVzlDb4BTb2EzYpdDOuBTQthjdnplSr1mWQZ1cvYUM&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=HM04UaXVnQapVUvJjcxgWO1Z1YORDavJ3KNNWMmdEVJhVcwJld3kDWMFEbNplQud3dFlmYkd2RTBFT=0TVCF3TydnWMdnSiZ1VUlleRhndwR0RoJUeW9iQppENhZmc3ZEbrBTQthjdnplSr1mWQZ1cvYUMkR&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ihUS1cWRSR1M59EdKtUO5QjaDBXcoNEUqpWerpGR5dTbKZEOIZnZjJXYlNVMBVWOBpGSjFWTElHbtNHUkhlcUNDSMVEbtFWe2F2LhJVUmd3cQRnNutGb3sidINGNtF0MC1GaxNTUz10NvU0dyV2SXZmQ19GOxkGT&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ihUS1cWRSR1M59EdKtUO5QjaDBXcoNEUqpWerpGR5dTbKZEOIZnZjJXYlNVMBVWOBpGSjFWTElHbtNHUUZkM4xmTSFWVJhVTVdnS4k0U3NVMMR0blZ0KrllTvZVZUp0K4VHcrNTUz10NvU0dyV2SXZmQ19GOxkGT&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mFTcr8mRWNFaMF1RTRWOwR1aZlWe1gURVRWcYV2YjR3SQJTc0VkdwdVYqZGdEFUYYVTOHxURlJlWQN2UL9UQBBlN4BTa3cTUidzVXtyM58EWjdmdwRkZrITTxImWF5EUUFXQSJFZ0dVRIJWWCJUNzE0cjZUZyhTO&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mFTcr8mRWNFaMF1RTRWOwR1aZlWe1gURVRWcYV2YjR3SQJTc0VkdwdVYqZGdEFUYYVTOHxURlJlWQN2Uhl2cpp0UrhjWrYEbCdHTrkXSB9WM3Bne5skNZlne0Vlcw9WM6t2SXlUT0dVRIJWWCJUNzE0cjZUZyhTO&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FRVOppnUxITNXVFZnl2RLRDb1ImY21URvg3VYlGNaNzSIRzc2V2NlRVNvJ2bEJjaahVaJdHeGJWRq1kVyMDOGlEMoFEdp10ckV3YOpFVINTdtZEe0V0NiREOwllYup2SQZFR5QXe01mb2JGaMRlR0gDMMlzYGN1Y&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FRVOppnUxITNXVFZnl2RLRDb1ImY21URvg3VYlGNaNzSIRzc2V2NlRVNvJ2bEJjaahVaJdHeGJWRq1kVh5USVFXcmVDayQ1aC5mS0AjemZkMsZVO1EFSSp0bOVHS5IHZXNjMNVEb01mb2JGaMRlR0gDMMlzYGN1Y&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=2lDOzMDZvkUcyp3dXVWeDJXR1REahRHaktUM0QnNsdFOhFEVsZUSSZ3VyQnejR0VGdDbahGcnVnaMBXWiBXS1kXayUzKPZ0Kpx0MwUleEp2NIh3T3tGd0MUW1o2MjVkNnN1aQhETElUNsZXe4pFexRmMadGSvQWU&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=OBzSnt2QJN1MmVmT18kMjlzRaBzbUN2N0hmZRVkWHdWTr40KFp1TWllNItUZjV0MY5GTnJFa51EUmp1YrsyaxRkNVlGNtZjWC9CRBVlaVRTYmRlSPplV0g1Q2I0YCdGWN9WO4gESMdzSERHTCdUSpZjZrxEaLFFV&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=OBzSnt2QJN1MmVmT18kMjlzRaBzbUN2N0hmZRVkWHdWTr40KFp1TWllNItUZjV0MY5GTnJFa51EUmp1YLBDS0VWdGpkSjNmc100b142T3NjTvFldKNVSrQGbGVmSBV2NLlGRCtEZQdzSERHTCdUSpZjZrxEaLFFV&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=OBzSnt2QJN1MmVmT18kMjlzRaBzbUN2N0hmZRVkWHdWTr40KFp1TWllNItUZjV0MY5GTnJFa51EUmp1Y6dnUO1mca5GSW52MI12dihEZCdTZvZEUW90bWRXewEzcwkEVN9WO4gESMdzSERHTCdUSpZjZrxEaLFFV&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=NhmRzoFV31GShdTZN50crMWWK9yLENEbWVXezAXeshURvcGNiBXRyZUTWBFcwQFdF50cxMUYah1QItkZpplMGl2QQ9CcqlnYidlY1QDS0p1YlNEV1N0M5sEd4UXejpHcSJDUNVTc4gHTUt0SyEHatlVUk1WUyRkS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=NhmRzoFV31GShdTZN50crMWWK9yLENEbWVXezAXeshURvcGNiBXRyZUTWBFcwQFdF50cxMUYah1QItkZUllMykXM08WOnxWMv9GRDZkdWZzNhxmNwR3cEF3cU5WMyI0a4Q1KSVTc4gHTUt0SyEHatlVUk1WUyRkS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=PN2M5J2NP5GdlpmQVp1bKpHSzVUUQJTSVBXMwdlWSN3RkhkNyJDOit0ZWRDaaNFb3cGZY52UCFHai1WavZzMSpEVWVnYOV3VGpWbzU3Q5MjUFdDVQFWYOllUWBFdWZ3NwoWdONXeKhjMWt0RV52NQVmWx9CMHVEU&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=PN2M5J2NP5GdlpmQVp1bKpHSzVUUQJTSVBXMwdlWSN3RkhkNyJDOit0ZWRDaaNFb3cGZY52UCFHai1WaFhXSBR0K3UXS1ZHV1kEcz8iMTRXbYd0ZZdUcL1mTP92aRt2N3AVY3R2bKhjMWt0RV52NQVmWx9CMHVEU&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1cjdyZzd1YnNzkVcIdjZ2dzK3hnNF5mRyxkYysmRTdXOiVEWItSNZljYT1mZP5WY2llWwhFTilUT3dVbFJ2Z4dTdS52b49kchBlQuhHOQhXc3ZFbVdHUKdmQPl2VzZXQTN2Rjl3dNJVe2FTWkdTT30meB9COvU3c&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1cjdyZzd1YnNzkVcIdjZ2dzK3hnNF5mRyxkYysmRTdXOiVEWItSNZljYT1mZP5WY2llWwhFTilUT3dVbSJ2Z4dTdS52b49kchBlQuhHOQhXc3ZFbVdHUKdmQPl2VzZXQTN2Rjl3dNJVe2FTWkdTT30meB9COvU3c&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=hZ1VhhGUPJHaroVO3J3Nw12QRdVdUpHO4lnVIFDa5UFTnZ0SFFGTDRTc3Y1Rw1mcElkVwlERCR1cZhEcENjSTJWVEpFODZFNNJmW1pEU2gTbzA1LmhVb50EOnlEZw5UTVl1T3ona5UFZZdjarBVR0FXSV5WZ4FkM&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=hZ1VhhGUPJHaroVO3J3Nw12QRdVdUpHO4lnVIFDa5UFTnZ0SFFGTDRTc3Y1Rw1mcElkVwlERCR1cZhEcp1WbtZETyglU5pWQsp1LEVFaL12VT5GOwJ0czRlVrJ0QPBlMLNHRNdFc5UFZZdjarBVR0FXSV5WZ4FkM&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ih3TJhFaw5WUwRlVlBDUQ1mUYpUVU9UVkh3ZBJDePVEaZBXVZFFWyd0N4YXe4YTZyllMLR3djxmZzp2cpFzSztkMm9iV0NVRMlkeU9CTnlVbHJEdHZ3cSV2YrI1aPBHbK9UbRdjT5UHUnxWeBRnMCljUiBjbxFla&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=ih3TJhFaw5WUwRlVlBDUQ1mUYpUVU9UVkh3ZBJDePVEaZBXVZFFWyd0N4YXe4YTZyllMLR3djxmZzp2cMVmQ4I1STdXbsp0YO5mbPpWePV2MrAleQZnR1ITWDFjVS12cyI2RuVDW5UHUnxWeBRnMCljUiBjbxFla&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=IBzU6ZDRvI0VtJ1bulEbGJVNhFDMKpkUqZVVRp1Z3l1K3YEardGaZN1ZiFXUwg1SzVWUhV2ZEV0SVVld5RUbUNTbSlVMqRXMPlUM01EbD9WMDl2bhhnUQBTaSpUQvIjWxUHUnB1dqdkSRtyVEZFTLdlW20WQJRUM&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=P1kTRVTe4wkcrgEZSZ2dZhndxAFehJXZ2hlWjlFZDdWVOJzRJtCO0JnZXtkVrEmeU5GTpdlWkdVcvVkeMJ0UM12axcDaR1Eb3IzLZFHTBhFO0l2cQNUSwZTTwFlQ2l1N25GWDZTNoNke3BzV2U0ZvVGdod0L5RXZ&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=P1kTRVTe4wkcrgEZSZ2dZhndxAFehJXZ2hlWjlFZDdWVOJzRJtCO0JnZXtkVrEmeU5GTpdlWkdVcvVkeHRGOHdnQNJ3dOlUYQFlbGNEbqhGWiJWb5smc0tWTwFlQ2l1N25GWDZTNoNke3BzV2U0ZvVGdod0L5RXZ&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=uN0VKF1KRFWRsdmThFVZVlmQnhGaGhle1sUUXBVOtNDSuh0apl3KzlnaxhWdzgjR3NVRFhkU3hGZRd2QQV2NLZjTFZ3MyVDOUVnMiFXWrAjarIFcmJTZ1F1MopldIFEOWh2QJNkNv1GUzdld6NEbKBXNulmZyplN&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=uN0VKF1KRFWRsdmThFVZVlmQnhGaGhle1sUUXBVOtNDSuh0apl3KzlnaxhWdzgjR3NVRFhkU3hGZRd2Qp52MPZjTFZ3MyVDOUVnMiFXWrAjarIFcmJTZ1F1MopldIFEOWh2QJNkNv1GUzdld6NEbKBXNulmZyplN&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1Y2ZI9mSz9UZtFXWxhjcSFGOHhDMkhkUkJFe2VkYnt2YUhFTvEDNrhFcWNXOFNzRuhTSENnSYJUSsJlRSlnV3AHU1glY2M0aatiQ0Q0dFJmV6dnRCFzTHdHSv8ySERDVzZ0dz12M1ZHVsR3KKpncNBnQwImcKxkd&tablename=CJFDLAST2021&dflag=pdfdown']"
      ]
     },
     "execution_count": 65,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Display the site-relative PDF download paths gathered from the detail pages\n",
    "pdf_links"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 66,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['https://kns.cnki.net/kcms/download.aspx?filename=phHWmV3RDFWROh2TI12LUZ0cylmU3FGayJzLrVHNRJkaa12VtZUVyQ0S3hDVGRjZEV0V1RVZlNWUMxUeFhXWpdDaKZTVoF3NW1URvcXdmFFZp52VWZmcydTTh9EUOhGasBTbycTNmN3TqdVZHVjS4B1YuF2YU9EU&tablename=CAPJDAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=HWmV3RDFWROh2TI12LUZ0cylmU3FGayJzLrVHNRJkaa12VtZUVyQ0S3hDVGRjZEV0V1RVZlNWUMxUe=0TWzQjRItGcxNjb1MXenVkaRV0QlZ2V3xWUDxET3FETHt0SoNESiN3TqdVZHVjS4B1YuF2YU9EUph&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=DTUdnVvdVZ4EEN5FzbWZjaJR2YX90KMtUMGtme4VkQQFldLlzbzwkUFZWO5ZnYCpmTFVEWG5mdmZnQ=0TSzw2SvkFMWRUSSBDc4xWbn9EO2sCeBRFWqVFWzMTOy1WeBR2LQd1MQJFaywURxJ3NXVHMxcDcHV&tablename=CJFDAUTODAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=DTUdnVvdVZ4EEN5FzbWZjaJR2YX90KMtUMGtme4VkQQFldLlzbzwkUFZWO5ZnYCpmTFVEWG5mdmZnQ=0TUDJTUUVVd0NHZQdHUkBjSP5kSvNEe2cDWqVFWzMTOy1WeBR2LQd1MQJFaywURxJ3NXVHMxcDcHV&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=GZJdnaz1GdNd0QixGU3gGMxF1b0JjUMVFWMNkMPJEbSRDbLVjMaZ1NlpHelZHeGp1YjBHUnZUYIllR=0zbMZ0TF9SRpdmd3U3MuFHbmpVaCFzVWJFRzFXazYWRnBVMKJHOLNmRWRzK0wmYwR3MrwUbXdUYDh&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=2bnVFV5wENUN1dLFmM3V2ToFGS4tyNupER6lWchV0ZBljMzJXV0N2bKhFTWpmW1MEbVpVSHl1TilUS=0DMTpEe0lGU0EXWT9We5VHTvclUsJVOJZDaiN1RjlkWKl1RJFUSRpVN4JUU5Z1QwRnNzYlRP9UbQJ&tablename=CJFDAUTODAY&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=QJ2bnVFV5wENUN1dLFmM3V2ToFGS4tyNupER6lWchV0ZBljMzJXV0N2bKhFTWpmW1MEbVpVSHl1TilUSK1WQnpXc0NzRYNVUxBHcxIDVsJjYtB1YNV2N1BTciFnUFdmbzUjbxJmeSpVN4JUU5Z1QwRnNzYlRP9Ub&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=rQFeIREVhhVZvljMzoWS2pVeMdkcp9yYpd2KltiNI1kS4JHahZEetdVaMt0RHp2Q39ybLtkQolGdERHTjFXVVBFNXZkMJZ2N18UZsVGVQdFbiVEN2hma1AHNulmUwo3U3dnYiNlYBF2Z5p0TFh1YllVNOpHWtFmU&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=5gERrVjaPJkapFDMNVzQBR2cwgnNKh3KRBFUlV0YxsGaE1mUlpGVPF3SkV1M2VzaoRlS5cGbqRVRzZ0UycFOjNXOmpXeIZDTUpXSHJkah9UVqN3VQ1EWChlY6h2ZwUHUGVmT28kapJUaplUY3omVIR1bpFEZxQ3L&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=uBFWnR2VRVGNWNzV2UXRHdXdwJHNX12YnVkSYd1NGlTe6NVNrlTcVFTcO1UcI9CVsBVeOFFZKVmcVFnVlNWQPZ0aBN0bBt0bOFTUYhTbYRHcMBTbJRzcuhjYo9iYilkVyo2LvBHZ3cHZGZmYT9GOZNHalZGOMNVY&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=uBFWnR2VRVGNWNzV2UXRHdXdwJHNX12YnVkSYd1NGlTe6NVNrlTcVFTcO1UcI9CVsBVeOFFZKVmcVFnVpF1RzRjTup1S5VURadkQkd0KaVETEFXStplZykWMtllZwUkTth0K5hHd0cHZGZmYT9GOZNHalZGOMNVY&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=t9mcOdUQ5AXMv4WVshzRFN3VrJFN69UdwgkbkNEOzl2MSNWM4YEUy9ER39iV2Z1LJZ2Q4J0Vjh3VvNVWI5WYkhnWDVnWIV1LvtiNldzSNRXd3RTbHhUQwEXNPF2TWllYslGS3J0Y2pkSr1kcVlFM0ZWaSBDczQTd&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=t9mcOdUQ5AXMv4WVshzRFN3VrJFN69UdwgkbkNEOzl2MSNWM4YEUy9ER39iV2Z1LJZ2Q4J0Vjh3VvNVWTplTWNXWpRWduZjYxskNB9UM4IkbJhXc25kcykVNKZlaCpnTiVkeIpnU1pkSr1kcVlFM0ZWaSBDczQTd&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=TMNtkeTVlW4MnMFNUevtyTxYjRNRXMT1kVW9ENqh1SFZnWHtCRmJ0TtdVOjRmYKJVMXJ0amxkeoJEb=0TREZjQyQzTkdGSlhEe5E2NiRzTyUUYihEOYlUbPt0M2V1U2ZFV0FlWHFUcJh2Z1EHWJdVRFNzLlV&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=GSvl2b3lDaalVYIJ2LDNHdKt0dKhGbOxGbx5GV1smawVlSHZnN1UVV2F0UmJ2bxdXUhx2YHVmZKtGc=0TUK12Z5pFcRVTSRRWQzBTRrgHSuZlSqhXROplaYdVb3h0cRN1VCF0L2ZlbrkjU3kEdMZXcKZmcTR&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=t1kYvNDNPRDOL9icJRGM3kHd0Y1Z0sSePhkMzEUN4knehVXTPp0NOlDT3Zzc4B3Ky42b0YVVn92SkZ1cwIlc4UDRptUdM5Ge5oXNFhFehdVc01Wbzc3UrBFSPd0Nx0UVzBzRrMXZ1YVZjdjayYjcTRzU4ETaJxWY&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=5gEbzMWbrBjTshmUwVHMMFzVY90QBh3LltyKrYEbTFTZ5gUV5UFdvUWR6ZGbPZkV6VGM5ckTIhEeGhndudkS5IkYZ5kMrJkNWV3a3FXbt92TXpFc18ybQdFbxdGc3RHbwZ3YsNHWzc1cspVViF0UNdlQxNkQ0Q2M&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=wsCWmVHbvoVRLd1KyQmdQVXc0RVM4onR2gDR002Src3MiNWMwZTel1ETyFWc2l2cRNjazJnRppFZhhWeKlEMBVEVYp3TWtEbz0mepF3VolFUQd1brEjNwkEV5kVb0F3YRtmawAlbChmRK9SUEFlM3hkRJZ3Q0ZTZ&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=2RzK0AVShJWbzlENwgnMlZUdqRWc34kTHBzY3h3ZCZ2L6lzLwhUY1Rjet9yR4l0dpBnT41UciNkdXVnRoZ1MwRWW3AFMkJmaxtEcEp3VnNnMJN1MFdFRnNUZo1URGNTZ5oVcGJ0bspFZspWRvIUQ4dWWtdnS2V3V&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=2RzK0AVShJWbzlENwgnMlZUdqRWc34kTHBzY3h3ZCZ2L6lzLwhUY1Rjet9yR4l0dpBnT41UciNkdXVnRzYHeP9ESrlkTktGZx4Uc3gDe6dldCJkU1tEOXtWUGl2KsFUcrADMZFTYrpFZspWRvIUQ4dWWtdnS2V3V&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=uNjUURHNrZGb0N0T4clY0VVVPt0KXhTcFN2Ny1EbyYFUOBzZwYXeoxWc2MWUZJTdxVUeGhnaDZlYxZWS2QjYhlkRrQFcKtWYiBTUYRmY1VTU2kDc2JHdJ52LKB3YnlXRSJXRLl3MxljT0V3YYNjTo9SZ5Z2SnF3S&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=jUURHNrZGb0N0T4clY0VVVPt0KXhTcFN2Ny1EbyYFUOBzZwYXeoxWc2MWUZJTdxVUeGhnaDZlYxZWS=0TTwhUZvFGUyd3Ss5kYOtEWzsWQxYGS0U0ZqV3MONjTyFVN2sWVxljT0V3YYNjTo9SZ5Z2SnF3SuN&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=kRHM04UaXVnQapVUvJjcxgWO1Z1YORDavJ3KNNWMmdEVJhVcwJld3kDWMFEbNplQud3dFlmYkd2RTBFTaRDROh2MsB1aLBjNQdVbwkza3oUS69UMZh2NCpFVzlDb4BTb2EzYpdDOuBTQthjdnplSr1mWQZ1cvYUM&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=HM04UaXVnQapVUvJjcxgWO1Z1YORDavJ3KNNWMmdEVJhVcwJld3kDWMFEbNplQud3dFlmYkd2RTBFT=0TVCF3TydnWMdnSiZ1VUlleRhndwR0RoJUeW9iQppENhZmc3ZEbrBTQthjdnplSr1mWQZ1cvYUMkR&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ihUS1cWRSR1M59EdKtUO5QjaDBXcoNEUqpWerpGR5dTbKZEOIZnZjJXYlNVMBVWOBpGSjFWTElHbtNHUkhlcUNDSMVEbtFWe2F2LhJVUmd3cQRnNutGb3sidINGNtF0MC1GaxNTUz10NvU0dyV2SXZmQ19GOxkGT&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ihUS1cWRSR1M59EdKtUO5QjaDBXcoNEUqpWerpGR5dTbKZEOIZnZjJXYlNVMBVWOBpGSjFWTElHbtNHUUZkM4xmTSFWVJhVTVdnS4k0U3NVMMR0blZ0KrllTvZVZUp0K4VHcrNTUz10NvU0dyV2SXZmQ19GOxkGT&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mFTcr8mRWNFaMF1RTRWOwR1aZlWe1gURVRWcYV2YjR3SQJTc0VkdwdVYqZGdEFUYYVTOHxURlJlWQN2UL9UQBBlN4BTa3cTUidzVXtyM58EWjdmdwRkZrITTxImWF5EUUFXQSJFZ0dVRIJWWCJUNzE0cjZUZyhTO&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mFTcr8mRWNFaMF1RTRWOwR1aZlWe1gURVRWcYV2YjR3SQJTc0VkdwdVYqZGdEFUYYVTOHxURlJlWQN2Uhl2cpp0UrhjWrYEbCdHTrkXSB9WM3Bne5skNZlne0Vlcw9WM6t2SXlUT0dVRIJWWCJUNzE0cjZUZyhTO&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FRVOppnUxITNXVFZnl2RLRDb1ImY21URvg3VYlGNaNzSIRzc2V2NlRVNvJ2bEJjaahVaJdHeGJWRq1kVyMDOGlEMoFEdp10ckV3YOpFVINTdtZEe0V0NiREOwllYup2SQZFR5QXe01mb2JGaMRlR0gDMMlzYGN1Y&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FRVOppnUxITNXVFZnl2RLRDb1ImY21URvg3VYlGNaNzSIRzc2V2NlRVNvJ2bEJjaahVaJdHeGJWRq1kVh5USVFXcmVDayQ1aC5mS0AjemZkMsZVO1EFSSp0bOVHS5IHZXNjMNVEb01mb2JGaMRlR0gDMMlzYGN1Y&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=2lDOzMDZvkUcyp3dXVWeDJXR1REahRHaktUM0QnNsdFOhFEVsZUSSZ3VyQnejR0VGdDbahGcnVnaMBXWiBXS1kXayUzKPZ0Kpx0MwUleEp2NIh3T3tGd0MUW1o2MjVkNnN1aQhETElUNsZXe4pFexRmMadGSvQWU&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=OBzSnt2QJN1MmVmT18kMjlzRaBzbUN2N0hmZRVkWHdWTr40KFp1TWllNItUZjV0MY5GTnJFa51EUmp1YrsyaxRkNVlGNtZjWC9CRBVlaVRTYmRlSPplV0g1Q2I0YCdGWN9WO4gESMdzSERHTCdUSpZjZrxEaLFFV&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=OBzSnt2QJN1MmVmT18kMjlzRaBzbUN2N0hmZRVkWHdWTr40KFp1TWllNItUZjV0MY5GTnJFa51EUmp1YLBDS0VWdGpkSjNmc100b142T3NjTvFldKNVSrQGbGVmSBV2NLlGRCtEZQdzSERHTCdUSpZjZrxEaLFFV&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=OBzSnt2QJN1MmVmT18kMjlzRaBzbUN2N0hmZRVkWHdWTr40KFp1TWllNItUZjV0MY5GTnJFa51EUmp1Y6dnUO1mca5GSW52MI12dihEZCdTZvZEUW90bWRXewEzcwkEVN9WO4gESMdzSERHTCdUSpZjZrxEaLFFV&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=NhmRzoFV31GShdTZN50crMWWK9yLENEbWVXezAXeshURvcGNiBXRyZUTWBFcwQFdF50cxMUYah1QItkZpplMGl2QQ9CcqlnYidlY1QDS0p1YlNEV1N0M5sEd4UXejpHcSJDUNVTc4gHTUt0SyEHatlVUk1WUyRkS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=NhmRzoFV31GShdTZN50crMWWK9yLENEbWVXezAXeshURvcGNiBXRyZUTWBFcwQFdF50cxMUYah1QItkZUllMykXM08WOnxWMv9GRDZkdWZzNhxmNwR3cEF3cU5WMyI0a4Q1KSVTc4gHTUt0SyEHatlVUk1WUyRkS&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=PN2M5J2NP5GdlpmQVp1bKpHSzVUUQJTSVBXMwdlWSN3RkhkNyJDOit0ZWRDaaNFb3cGZY52UCFHai1WavZzMSpEVWVnYOV3VGpWbzU3Q5MjUFdDVQFWYOllUWBFdWZ3NwoWdONXeKhjMWt0RV52NQVmWx9CMHVEU&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=PN2M5J2NP5GdlpmQVp1bKpHSzVUUQJTSVBXMwdlWSN3RkhkNyJDOit0ZWRDaaNFb3cGZY52UCFHai1WaFhXSBR0K3UXS1ZHV1kEcz8iMTRXbYd0ZZdUcL1mTP92aRt2N3AVY3R2bKhjMWt0RV52NQVmWx9CMHVEU&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1cjdyZzd1YnNzkVcIdjZ2dzK3hnNF5mRyxkYysmRTdXOiVEWItSNZljYT1mZP5WY2llWwhFTilUT3dVbFJ2Z4dTdS52b49kchBlQuhHOQhXc3ZFbVdHUKdmQPl2VzZXQTN2Rjl3dNJVe2FTWkdTT30meB9COvU3c&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1cjdyZzd1YnNzkVcIdjZ2dzK3hnNF5mRyxkYysmRTdXOiVEWItSNZljYT1mZP5WY2llWwhFTilUT3dVbSJ2Z4dTdS52b49kchBlQuhHOQhXc3ZFbVdHUKdmQPl2VzZXQTN2Rjl3dNJVe2FTWkdTT30meB9COvU3c&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=hZ1VhhGUPJHaroVO3J3Nw12QRdVdUpHO4lnVIFDa5UFTnZ0SFFGTDRTc3Y1Rw1mcElkVwlERCR1cZhEcENjSTJWVEpFODZFNNJmW1pEU2gTbzA1LmhVb50EOnlEZw5UTVl1T3ona5UFZZdjarBVR0FXSV5WZ4FkM&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=hZ1VhhGUPJHaroVO3J3Nw12QRdVdUpHO4lnVIFDa5UFTnZ0SFFGTDRTc3Y1Rw1mcElkVwlERCR1cZhEcp1WbtZETyglU5pWQsp1LEVFaL12VT5GOwJ0czRlVrJ0QPBlMLNHRNdFc5UFZZdjarBVR0FXSV5WZ4FkM&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ih3TJhFaw5WUwRlVlBDUQ1mUYpUVU9UVkh3ZBJDePVEaZBXVZFFWyd0N4YXe4YTZyllMLR3djxmZzp2cpFzSztkMm9iV0NVRMlkeU9CTnlVbHJEdHZ3cSV2YrI1aPBHbK9UbRdjT5UHUnxWeBRnMCljUiBjbxFla&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=ih3TJhFaw5WUwRlVlBDUQ1mUYpUVU9UVkh3ZBJDePVEaZBXVZFFWyd0N4YXe4YTZyllMLR3djxmZzp2cMVmQ4I1STdXbsp0YO5mbPpWePV2MrAleQZnR1ITWDFjVS12cyI2RuVDW5UHUnxWeBRnMCljUiBjbxFla&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=IBzU6ZDRvI0VtJ1bulEbGJVNhFDMKpkUqZVVRp1Z3l1K3YEardGaZN1ZiFXUwg1SzVWUhV2ZEV0SVVld5RUbUNTbSlVMqRXMPlUM01EbD9WMDl2bhhnUQBTaSpUQvIjWxUHUnB1dqdkSRtyVEZFTLdlW20WQJRUM&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=P1kTRVTe4wkcrgEZSZ2dZhndxAFehJXZ2hlWjlFZDdWVOJzRJtCO0JnZXtkVrEmeU5GTpdlWkdVcvVkeMJ0UM12axcDaR1Eb3IzLZFHTBhFO0l2cQNUSwZTTwFlQ2l1N25GWDZTNoNke3BzV2U0ZvVGdod0L5RXZ&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=P1kTRVTe4wkcrgEZSZ2dZhndxAFehJXZ2hlWjlFZDdWVOJzRJtCO0JnZXtkVrEmeU5GTpdlWkdVcvVkeHRGOHdnQNJ3dOlUYQFlbGNEbqhGWiJWb5smc0tWTwFlQ2l1N25GWDZTNoNke3BzV2U0ZvVGdod0L5RXZ&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=uN0VKF1KRFWRsdmThFVZVlmQnhGaGhle1sUUXBVOtNDSuh0apl3KzlnaxhWdzgjR3NVRFhkU3hGZRd2QQV2NLZjTFZ3MyVDOUVnMiFXWrAjarIFcmJTZ1F1MopldIFEOWh2QJNkNv1GUzdld6NEbKBXNulmZyplN&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=uN0VKF1KRFWRsdmThFVZVlmQnhGaGhle1sUUXBVOtNDSuh0apl3KzlnaxhWdzgjR3NVRFhkU3hGZRd2Qp52MPZjTFZ3MyVDOUVnMiFXWrAjarIFcmJTZ1F1MopldIFEOWh2QJNkNv1GUzdld6NEbKBXNulmZyplN&tablename=CJFDLAST2021&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1Y2ZI9mSz9UZtFXWxhjcSFGOHhDMkhkUkJFe2VkYnt2YUhFTvEDNrhFcWNXOFNzRuhTSENnSYJUSsJlRSlnV3AHU1glY2M0aatiQ0Q0dFJmV6dnRCFzTHdHSv8ySERDVzZ0dz12M1ZHVsR3KKpncNBnQwImcKxkd&tablename=CJFDLAST2021&dflag=pdfdown']"
      ]
     },
     "execution_count": 66,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 修复正确的PDF下载链接\n",
    "pdf_href=['https://kns.cnki.net'+link for link in pdf_links]\n",
    "pdf_href"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 67,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>森林生态站大数据快速存储与索引方法  网络首发</td>\n",
       "      <td>王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福</td>\n",
       "      <td>农业机械学报</td>\n",
       "      <td>2021-07-06 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》</td>\n",
       "      <td>张诗雨</td>\n",
       "      <td>锻压技术</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>基于大数据分析的舰船装备寿命测试系统</td>\n",
       "      <td>化雪荟</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-06-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>基于大数据与信息技术的拖拉机零部件供应链</td>\n",
       "      <td>王弥</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>104.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>智能制造和大数据挖掘在农业机械设计中的应用</td>\n",
       "      <td>杜伯阳</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>基于特征加权的分布式大数据相关性挖掘方法</td>\n",
       "      <td>戴惠丽; 王敬宇</td>\n",
       "      <td>计算机仿真</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>基于AI的车载智能语音识别报警系统研制</td>\n",
       "      <td>苏明; 艾海明; 王东明</td>\n",
       "      <td>传感器与微系统</td>\n",
       "      <td>2021-06-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>165.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>人工智能教育的含义界定与原理挖掘</td>\n",
       "      <td>彭绍东</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-06-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>881.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>人工智能应用场景的界定与开发</td>\n",
       "      <td>李梦薇; 徐峰; 高芳</td>\n",
       "      <td>中国科技论坛</td>\n",
       "      <td>2021-06-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>123.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>滚刀状态实时诊断技术在超大直径泥水盾构中的应用——以汕头苏埃通道为例</td>\n",
       "      <td>魏晓龙; 林福龙; 孟祥波; 周树亮; 郭俊可</td>\n",
       "      <td>隧道建设(中英文)</td>\n",
       "      <td>2021-06-01 09:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>78.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>近5年图情SSCI期刊人工智能伦理研究文献分析与启示</td>\n",
       "      <td>黄崑; 徐晓婷; 黎安润泽; 徐峰</td>\n",
       "      <td>现代情报</td>\n",
       "      <td>2021-06-01</td>\n",
       "      <td>NaN</td>\n",
       "      <td>671.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>教育信息化2.0背景下省级教育大数据平台建设研究  网络首发</td>\n",
       "      <td>汤岭球</td>\n",
       "      <td>当代教育论坛</td>\n",
       "      <td>2021-05-26 18:52</td>\n",
       "      <td>NaN</td>\n",
       "      <td>525.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>大数据挖掘技术的光流场图像匹配方法设计</td>\n",
       "      <td>黄凯宁; 郭有强; 杨静</td>\n",
       "      <td>激光杂志</td>\n",
       "      <td>2021-05-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>36.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>大数据驱动的船舶航行路径跟踪研究</td>\n",
       "      <td>王冷</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-05-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>基于人工智能技术的船舶智能制造系统</td>\n",
       "      <td>聂华; 雷开元</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-05-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>64.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>大数据下基于机器学习的项目智能成本管理研究——以A风景园林规划研究院规划设计类项目为例</td>\n",
       "      <td>程平; 彭兰雅; 辜榕容</td>\n",
       "      <td>财会通讯</td>\n",
       "      <td>2021-05-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>234.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>新时期中欧人工智能发展战略与政策环境的比较研究</td>\n",
       "      <td>关皓元; 高杰</td>\n",
       "      <td>管理现代化</td>\n",
       "      <td>2021-05-17 15:21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>342.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>大数据技术视域下智慧图书馆伦理危机与控制研究</td>\n",
       "      <td>陆康; 刘慧; 曹畋</td>\n",
       "      <td>高校图书馆工作</td>\n",
       "      <td>2021-05-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>161.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>智能时代的中小学人工智能教育：总体定位与核心内容领域</td>\n",
       "      <td>卢宇; 汤筱玙; 宋佳宸; 余胜泉</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-05-12</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1139.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>大数据环境下基于谱机器学习的云物流资源配置</td>\n",
       "      <td>张人龙; 刘小红</td>\n",
       "      <td>统计与决策</td>\n",
       "      <td>2021-05-10 10:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>269.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>酶工程：从人工设计到人工智能  网络首发</td>\n",
       "      <td>王雅丽;付友思;陈俊宏;黄佳城;廖浪星</td>\n",
       "      <td>化工学报</td>\n",
       "      <td>2021-05-08 14:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>228.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>论技术向善何以可能——人工智能教育伦理的逻辑起点</td>\n",
       "      <td>孙田琳子</td>\n",
       "      <td>高教探索</td>\n",
       "      <td>2021-05-05</td>\n",
       "      <td>NaN</td>\n",
       "      <td>181.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>基于大数据的产品族本体造型意象挖掘方法研究  网络首发</td>\n",
       "      <td>王鹏; 朱韦龙</td>\n",
       "      <td>图学学报</td>\n",
       "      <td>2021-04-30 10:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>185.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>基于智能制造和大数据挖掘的农机数字化设计研究</td>\n",
       "      <td>任燕; 崔庚彦</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-04-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>238.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>语义分析及向量化大数据XSS入侵识别</td>\n",
       "      <td>张海军; 陈映辉</td>\n",
       "      <td>南开大学学报(自然科学版)</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>智能化学本评估初探——基于AI教师主讲课堂的试验研究</td>\n",
       "      <td>阮婷婷; 黄甫全; 曾文婕</td>\n",
       "      <td>教育研究与实验</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>96.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>大数据平台下化工企业消防安全风险分析指标设计</td>\n",
       "      <td>王滨滨;褚新颖;程诚;王禹寒;胡文倩</td>\n",
       "      <td>南开大学学报(自然科学版)</td>\n",
       "      <td>2021-04-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>53.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>知识牵引与数据驱动的兵棋AI设计及关键技术  网络首发</td>\n",
       "      <td>程恺; 陈刚; 余晓晗; 刘满; 邵天浩</td>\n",
       "      <td>系统工程与电子技术</td>\n",
       "      <td>2021-04-19 08:31</td>\n",
       "      <td>NaN</td>\n",
       "      <td>140.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>基于网络舆情大数据的公共政策评价研究</td>\n",
       "      <td>邱尔丽; 张竞; 王雨舟; 曹攀</td>\n",
       "      <td>领导科学</td>\n",
       "      <td>2021-04-16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>216.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>基于Mapreduce的多源多模态大数据检索方法研究</td>\n",
       "      <td>魏秀卓; 赵慧南</td>\n",
       "      <td>计算机仿真</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>71.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>从学习效果和教育公平的角度看高等教育人工智能应用——一项基于多个数据库英文同行评审期刊文献的综述</td>\n",
       "      <td>郝丹; 肖俊洪</td>\n",
       "      <td>现代教育技术</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>250.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>“城市仿真”大数据平台简介</td>\n",
       "      <td>NaN</td>\n",
       "      <td>交通运输系统工程与信息</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>44.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>人工智能非主体性前提下侵权责任承担机制研究</td>\n",
       "      <td>付其运</td>\n",
       "      <td>法学杂志</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>250.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>机用碳纤维/ABS复合材料人工智能辅助成型工艺关键技术研究</td>\n",
       "      <td>黄罡</td>\n",
       "      <td>化工新型材料</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>47.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>城市轨道交通勘测大数据的集成与应用</td>\n",
       "      <td>任传斌; 于淼; 李珂; 冯增文</td>\n",
       "      <td>地质论评</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>39.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>人工智能驱动下智慧养老服务模式构建研究</td>\n",
       "      <td>赵奕钧; 邓大松</td>\n",
       "      <td>江淮论坛</td>\n",
       "      <td>2021-04-12 10:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>980.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>电子科技大学周军教授团队在芯片奥林匹克会议ISSCC发表人工智能芯片论文</td>\n",
       "      <td>NaN</td>\n",
       "      <td>信息网络安全</td>\n",
       "      <td>2021-04-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>51.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>面向重大公共事务决策风险治理的大数据行动框架</td>\n",
       "      <td>毕凌燕; 张海璇; 左文明</td>\n",
       "      <td>科技管理研究</td>\n",
       "      <td>2021-04-10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>67.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>共智融合的大数据智能化人才培养研究与实践</td>\n",
       "      <td>冯永; 钟将; 王茜; 李学明</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-04-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>449.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>从教学样式到学习范式：人工智能环境下学习的通用设计转化</td>\n",
       "      <td>杨绪辉</td>\n",
       "      <td>中国电化教育</td>\n",
       "      <td>2021-04-08</td>\n",
       "      <td>NaN</td>\n",
       "      <td>336.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>人工智能教学中“知识建构、STEM、创客”三位一体教学模型的设计与应用</td>\n",
       "      <td>丁美荣; 王同聚</td>\n",
       "      <td>电化教育研究</td>\n",
       "      <td>2021-04-01</td>\n",
       "      <td>1.0</td>\n",
       "      <td>936.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>人工智能环境下广告创意人才的培养</td>\n",
       "      <td>赵朴</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-03-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>110.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>基于MapReduce的大数据在线聚集优化设计</td>\n",
       "      <td>李骏</td>\n",
       "      <td>河北大学学报(自然科学版)</td>\n",
       "      <td>2021-03-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>21.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>航空大数据研究综述</td>\n",
       "      <td>赵学武;吴宁;王军;阮利;李玲玲</td>\n",
       "      <td>计算机科学与探索</td>\n",
       "      <td>2021-03-23 16:56</td>\n",
       "      <td>NaN</td>\n",
       "      <td>412.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>人工智能技术的船舶航行轨迹控制算法</td>\n",
       "      <td>殷慧</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-03-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>大数据挖掘算法无人船信息管理系统</td>\n",
       "      <td>解莹</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-03-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>46.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>负责任的人工智能与设计创新</td>\n",
       "      <td>王韫; 徐迎庆</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>228.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>AI设计下的文本视觉问答技术</td>\n",
       "      <td>晋赞霞; 覃京燕; 殷绪成</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>54.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>AI设计下的智能驾驶场景文本识别技术</td>\n",
       "      <td>梁敏; 秦海波; 覃京燕; 殷绪成</td>\n",
       "      <td>包装工程</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>143.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>唯物史观论域下人工智能的伦理问题思考与合伦理设计</td>\n",
       "      <td>田鹏颖; 周鑫</td>\n",
       "      <td>宁夏社会科学</td>\n",
       "      <td>2021-03-20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>355.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                                 篇名  \\\n",
       "0            1                            森林生态站大数据快速存储与索引方法  网络首发   \n",
       "1            2  人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》   \n",
       "2            3                                 基于大数据分析的舰船装备寿命测试系统   \n",
       "3            4                               基于大数据与信息技术的拖拉机零部件供应链   \n",
       "4            5                              智能制造和大数据挖掘在农业机械设计中的应用   \n",
       "5            6                               基于特征加权的分布式大数据相关性挖掘方法   \n",
       "6            7                                基于AI的车载智能语音识别报警系统研制   \n",
       "7            8                                   人工智能教育的含义界定与原理挖掘   \n",
       "8            9                                     人工智能应用场景的界定与开发   \n",
       "9           10                 滚刀状态实时诊断技术在超大直径泥水盾构中的应用——以汕头苏埃通道为例   \n",
       "10          11                         近5年图情SSCI期刊人工智能伦理研究文献分析与启示   \n",
       "11          12                     教育信息化2.0背景下省级教育大数据平台建设研究  网络首发   \n",
       "12          13                                大数据挖掘技术的光流场图像匹配方法设计   \n",
       "13          14                                   大数据驱动的船舶航行路径跟踪研究   \n",
       "14          15                                  基于人工智能技术的船舶智能制造系统   \n",
       "15          16        大数据下基于机器学习的项目智能成本管理研究——以A风景园林规划研究院规划设计类项目为例   \n",
       "16          17                            新时期中欧人工智能发展战略与政策环境的比较研究   \n",
       "17          18                             大数据技术视域下智慧图书馆伦理危机与控制研究   \n",
       "18          19                         智能时代的中小学人工智能教育：总体定位与核心内容领域   \n",
       "19          20                              大数据环境下基于谱机器学习的云物流资源配置   \n",
       "20          21                               酶工程：从人工设计到人工智能  网络首发   \n",
       "21          22                           论技术向善何以可能——人工智能教育伦理的逻辑起点   \n",
       "22          23                        基于大数据的产品族本体造型意象挖掘方法研究  网络首发   \n",
       "23          24                             基于智能制造和大数据挖掘的农机数字化设计研究   \n",
       "24          25                                 语义分析及向量化大数据XSS入侵识别   \n",
       "25          26                         智能化学本评估初探——基于AI教师主讲课堂的试验研究   \n",
       "26          27                             大数据平台下化工企业消防安全风险分析指标设计   \n",
       "27          28                        知识牵引与数据驱动的兵棋AI设计及关键技术  网络首发   \n",
       "28          29                                 基于网络舆情大数据的公共政策评价研究   \n",
       "29          30                         基于Mapreduce的多源多模态大数据检索方法研究   \n",
       "30          31   从学习效果和教育公平的角度看高等教育人工智能应用——一项基于多个数据库英文同行评审期刊文献的综述   \n",
       "31          32                                      “城市仿真”大数据平台简介   \n",
       "32          33                              人工智能非主体性前提下侵权责任承担机制研究   \n",
       "33          34                      机用碳纤维/ABS复合材料人工智能辅助成型工艺关键技术研究   \n",
       "34          35                                  城市轨道交通勘测大数据的集成与应用   \n",
       "35          36                                人工智能驱动下智慧养老服务模式构建研究   \n",
       "36          37               电子科技大学周军教授团队在芯片奥林匹克会议ISSCC发表人工智能芯片论文   \n",
       "37          38                             面向重大公共事务决策风险治理的大数据行动框架   \n",
       "38          39                               共智融合的大数据智能化人才培养研究与实践   \n",
       "39          40                        从教学样式到学习范式：人工智能环境下学习的通用设计转化   \n",
       "40          41                人工智能教学中“知识建构、STEM、创客”三位一体教学模型的设计与应用   \n",
       "41          42                                   人工智能环境下广告创意人才的培养   \n",
       "42          43                            基于MapReduce的大数据在线聚集优化设计   \n",
       "43          44                                          航空大数据研究综述   \n",
       "44          45                                  人工智能技术的船舶航行轨迹控制算法   \n",
       "45          46                                   大数据挖掘算法无人船信息管理系统   \n",
       "46          47                                      负责任的人工智能与设计创新   \n",
       "47          48                                     AI设计下的文本视觉问答技术   \n",
       "48          49                                 AI设计下的智能驾驶场景文本识别技术   \n",
       "49          50                           唯物史观论域下人工智能的伦理问题思考与合伦理设计   \n",
       "\n",
       "                         作者             刊名              发表时间   被引      下载  操作  \\\n",
       "0    王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福         农业机械学报  2021-07-06 09:48  NaN     NaN  下载   \n",
       "1                       张诗雨           锻压技术        2021-06-25  NaN     8.0  下载   \n",
       "2                       化雪荟         舰船科学技术        2021-06-23  NaN     NaN  下载   \n",
       "3                        王弥          农机化研究        2021-06-15  NaN   104.0  下载   \n",
       "4                       杜伯阳          农机化研究        2021-06-15  NaN   186.0  下载   \n",
       "5                  戴惠丽; 王敬宇          计算机仿真        2021-06-15  NaN     NaN  下载   \n",
       "6              苏明; 艾海明; 王东明        传感器与微系统        2021-06-10  NaN   165.0  下载   \n",
       "7                       彭绍东         中国电化教育        2021-06-08  NaN   881.0  下载   \n",
       "8               李梦薇; 徐峰; 高芳         中国科技论坛        2021-06-05  NaN   123.0  下载   \n",
       "9   魏晓龙; 林福龙; 孟祥波; 周树亮; 郭俊可      隧道建设(中英文)  2021-06-01 09:56  NaN    78.0  下载   \n",
       "10        黄崑; 徐晓婷; 黎安润泽; 徐峰           现代情报        2021-06-01  NaN   671.0  下载   \n",
       "11                      汤岭球         当代教育论坛  2021-05-26 18:52  NaN   525.0  下载   \n",
       "12             黄凯宁; 郭有强; 杨静           激光杂志        2021-05-25  NaN    36.0  下载   \n",
       "13                       王冷         舰船科学技术        2021-05-23  NaN     9.0  下载   \n",
       "14                  聂华; 雷开元         舰船科学技术        2021-05-23  NaN    64.0  下载   \n",
       "15             程平; 彭兰雅; 辜榕容           财会通讯        2021-05-20  NaN   234.0  下载   \n",
       "16                  关皓元; 高杰          管理现代化  2021-05-17 15:21  NaN   342.0  下载   \n",
       "17               陆康; 刘慧; 曹畋        高校图书馆工作        2021-05-15  NaN   161.0  下载   \n",
       "18        卢宇; 汤筱玙; 宋佳宸; 余胜泉         中国远程教育        2021-05-12  NaN  1139.0  下载   \n",
       "19                 张人龙; 刘小红          统计与决策  2021-05-10 10:39  NaN   269.0  下载   \n",
       "20      王雅丽;付友思;陈俊宏;黄佳城;廖浪星           化工学报  2021-05-08 14:42  NaN   228.0  下载   \n",
       "21                     孙田琳子           高教探索        2021-05-05  NaN   181.0  下载   \n",
       "22                  王鹏; 朱韦龙           图学学报  2021-04-30 10:50  NaN   185.0  下载   \n",
       "23                  任燕; 崔庚彦          农机化研究        2021-04-28  NaN   238.0  下载   \n",
       "24                 张海军; 陈映辉  南开大学学报(自然科学版)        2021-04-20  NaN    18.0  下载   \n",
       "25            阮婷婷; 黄甫全; 曾文婕        教育研究与实验        2021-04-20  NaN    96.0  下载   \n",
       "26       王滨滨;褚新颖;程诚;王禹寒;胡文倩  南开大学学报(自然科学版)        2021-04-20  NaN    53.0  下载   \n",
       "27     程恺; 陈刚; 余晓晗; 刘满; 邵天浩      系统工程与电子技术  2021-04-19 08:31  NaN   140.0  下载   \n",
       "28         邱尔丽; 张竞; 王雨舟; 曹攀           领导科学        2021-04-16  NaN   216.0  下载   \n",
       "29                 魏秀卓; 赵慧南          计算机仿真        2021-04-15  NaN    71.0  下载   \n",
       "30                  郝丹; 肖俊洪         现代教育技术        2021-04-15  NaN   250.0  下载   \n",
       "31                      NaN    交通运输系统工程与信息        2021-04-15  NaN    44.0  下载   \n",
       "32                      付其运           法学杂志        2021-04-15  NaN   250.0  下载   \n",
       "33                       黄罡         化工新型材料        2021-04-15  NaN    47.0  下载   \n",
       "34         任传斌; 于淼; 李珂; 冯增文           地质论评        2021-04-15  NaN    39.0  下载   \n",
       "35                 赵奕钧; 邓大松           江淮论坛  2021-04-12 10:39  NaN   980.0  下载   \n",
       "36                      NaN         信息网络安全        2021-04-10  NaN    51.0  下载   \n",
       "37            毕凌燕; 张海璇; 左文明         科技管理研究        2021-04-10  NaN    67.0  下载   \n",
       "38          冯永; 钟将; 王茜; 李学明         中国电化教育        2021-04-08  NaN   449.0  下载   \n",
       "39                      杨绪辉         中国电化教育        2021-04-08  NaN   336.0  下载   \n",
       "40                 丁美荣; 王同聚         电化教育研究        2021-04-01  1.0   936.0  下载   \n",
       "41                       赵朴           出版广角        2021-03-30  NaN   110.0  下载   \n",
       "42                       李骏  河北大学学报(自然科学版)        2021-03-25  NaN    21.0  下载   \n",
       "43         赵学武;吴宁;王军;阮利;李玲玲       计算机科学与探索  2021-03-23 16:56  NaN   412.0  下载   \n",
       "44                       殷慧         舰船科学技术        2021-03-23  NaN    60.0  下载   \n",
       "45                       解莹         舰船科学技术        2021-03-23  NaN    46.0  下载   \n",
       "46                  王韫; 徐迎庆           包装工程        2021-03-20  NaN   228.0  下载   \n",
       "47            晋赞霞; 覃京燕; 殷绪成           包装工程        2021-03-20  NaN    54.0  下载   \n",
       "48        梁敏; 秦海波; 覃京燕; 殷绪成           包装工程        2021-03-20  NaN   143.0  下载   \n",
       "49                  田鹏颖; 周鑫         宁夏社会科学        2021-03-20  NaN   355.0  下载   \n",
       "\n",
       "                                                详细页链接  \\\n",
       "0   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "5   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "6   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "7   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "8   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "9   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "10  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "11  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "12  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "13  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "14  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "15  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "16  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "17  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "18  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "19  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "20  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "21  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "22  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "23  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "24  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "25  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "26  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "27  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "28  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "29  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "30  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "31  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "32  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "33  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "34  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "35  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "36  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "37  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "38  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "39  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "40  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "41  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "42  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "43  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "44  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "45  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "46  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "47  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "48  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "49  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                              PDF下载链接  \n",
       "0   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "5   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "6   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "7   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "8   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "9   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "10  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "11  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "12  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "13  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "14  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "15  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "16  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "17  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "18  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "19  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "20  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "21  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "22  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "23  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "24  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "25  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "26  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "27  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "28  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "29  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "30  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "31  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "32  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "33  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "34  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "35  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "36  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "37  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "38  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "39  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "40  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "41  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "42  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "43  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "44  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "45  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "46  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "47  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "48  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "49  https://kns.cnki.net/kcms/download.aspx?filena...  "
      ]
     },
     "execution_count": 67,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Attach the PDF download links as an extra column (pd.concat aligns on the row index).\n",
    "# A 'PDF下载链接' column left behind by a previous run of this cell is dropped first,\n",
    "# so re-running the cell does not append a duplicate column.\n",
    "df_pdf_links = pd.DataFrame({'PDF下载链接': pdf_href})\n",
    "df_页面表格 = pd.concat(\n",
    "    [df_页面表格.drop(columns=['PDF下载链接'], errors='ignore'), df_pdf_links],\n",
    "    axis=1,\n",
    ")\n",
    "df_页面表格"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 翻页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 68,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'下一页'"
      ]
     },
     "execution_count": 68,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Pagination: locate the \"next page\" control and display its inner HTML\n",
    "element = driver.find_element_by_id(\"PageNext\")\n",
    "element.get_attribute(\"innerHTML\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 69,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'1/28'"
      ]
     },
     "execution_count": 69,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Upper bound for paging: read the inner HTML of the countPageMark span\n",
    "element = driver.find_element_by_xpath('//span[@class=\"countPageMark\"]')\n",
    "page_str = element.get_attribute(\"innerHTML\")\n",
    "page_str"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 70,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['1', '28']"
      ]
     },
     "execution_count": 70,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Split the indicator text on '/'; the parts are still strings at this point\n",
    "page_int = page_str.split(sep='/')\n",
    "page_int"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 71,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28]\n"
     ]
    }
   ],
   "source": [
    "# Page numbers 1..N, where N is the second part of the split indicator\n",
    "pages = [*range(1, int(page_int[1]) + 1)]\n",
    "print(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 72,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Restrict the crawl to the first 18 pages\n",
    "pages = list(range(1, 19))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 73,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Accumulators filled by page_process; re-running this cell resets them.\n",
    "root_group = []       # one parsed lxml document per captured page\n",
    "表格_html = dict()     # loop value p -> inner HTML of the gridTable element\n",
    "\n",
    "# Module-level scratch names reset here; page_process never reads or writes them\n",
    "# (it works on its own local variables).\n",
    "main_content = \"\"\n",
    "element = None\n",
    "\n",
    "\n",
    "def page_process(pages, delay=15):\n",
    "    \"\"\"Click through the result pages and capture the HTML of each one.\n",
    "\n",
    "    For every value ``p`` in ``pages`` the \"next page\" button is clicked\n",
    "    first, so the content stored under ``p`` is the page displayed *after*\n",
    "    that click.\n",
    "\n",
    "    Args:\n",
    "        pages: iterable with one entry per click; each entry is printed as\n",
    "            progress and used as the key in ``表格_html``.\n",
    "        delay: seconds to sleep after each click (default 15) so the crawler\n",
    "            is not blocked.\n",
    "\n",
    "    Side effects:\n",
    "        Appends the parsed page source to ``root_group`` and stores the inner\n",
    "        HTML of the ``gridTable`` element in ``表格_html[p]``.\n",
    "    \"\"\"\n",
    "    for p in pages:\n",
    "        print(p, end='\\t')\n",
    "        # Click the \"next page\" button\n",
    "        driver.find_element_by_id('PageNext').click()\n",
    "        # Pause after each click so the crawler is not blocked\n",
    "        time.sleep(delay)\n",
    "\n",
    "        # Keep the parsed document of the page now displayed\n",
    "        root_group.append(fromstring(driver.page_source))\n",
    "\n",
    "        # Keep the inner HTML of the table that holds the page's main data\n",
    "        table_element = driver.find_element_by_id('gridTable')\n",
    "        表格_html[p] = table_element.get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 74,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\t2\t3\t4\t5\t6\t7\t8\t9\t10\t11\t12\t13\t14\t15\t16\t17\t18\t"
     ]
    }
   ],
   "source": [
    "# Run the pagination crawl over the selected pages\n",
    "page_process(pages=pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 75,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>html_snippets</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                        html_snippets\n",
       "1   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "2   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "3   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "4   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "5   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "6   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "7   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "8   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "9   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "10  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "11  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "12  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "13  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "14  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "15  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "16  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "17  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "18  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ..."
      ]
     },
     "execution_count": 75,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# One row per captured page, indexed by the dict key, with the HTML in a single column\n",
    "df = pd.Series(表格_html).to_frame(\"html_snippets\")\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 76,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Parse each stored HTML snippet and keep the first table that pandas finds in it\n",
    "link_df = []\n",
    "for p in pages:\n",
    "    表格 = pd.read_html(表格_html[p])[0]\n",
    "    link_df += [表格]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 77,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>51</td>\n",
       "      <td>基于大数据糖尿病患者膳食管理系统的设计</td>\n",
       "      <td>章琦; 章玮; 白正玉</td>\n",
       "      <td>中国全科医学</td>\n",
       "      <td>2021-03-18</td>\n",
       "      <td>NaN</td>\n",
       "      <td>239</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>人工智能算法在铁道车辆动力学仿真中的应用进展</td>\n",
       "      <td>唐兆;董少迪;罗仁;蒋涛;邓锐</td>\n",
       "      <td>交通运输工程学报</td>\n",
       "      <td>2021-03-16 11:06</td>\n",
       "      <td>NaN</td>\n",
       "      <td>269</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>人工智能时代算法风险的法律规制论纲</td>\n",
       "      <td>胡小伟</td>\n",
       "      <td>湖北大学学报(哲学社会科学版)</td>\n",
       "      <td>2021-03-16</td>\n",
       "      <td>1.0</td>\n",
       "      <td>862</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>营销领域人工智能研究综述</td>\n",
       "      <td>林子筠; 吴琼琳; 才凤艳</td>\n",
       "      <td>外国经济与管理</td>\n",
       "      <td>2021-03-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1214</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>多特征级联图像数据库目标人工智能匹配仿真</td>\n",
       "      <td>徐颖慧; 晋国卿</td>\n",
       "      <td>计算机仿真</td>\n",
       "      <td>2021-03-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>29</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>895</th>\n",
       "      <td>946</td>\n",
       "      <td>基于大数据分析的智能电网降损效果估计模型仿真</td>\n",
       "      <td>吕守旭</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2017-04-05</td>\n",
       "      <td>6.0</td>\n",
       "      <td>237</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>896</th>\n",
       "      <td>947</td>\n",
       "      <td>基于大数据分析的电网精准规划信息系统设计</td>\n",
       "      <td>杨玉新; 马伟; 赵阳</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>18.0</td>\n",
       "      <td>194</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>897</th>\n",
       "      <td>948</td>\n",
       "      <td>基于大数据的多媒体画面语言研究</td>\n",
       "      <td>王志军; 吴向文; 冯小燕; 温小勇</td>\n",
       "      <td>电化教育研究</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>15.0</td>\n",
       "      <td>1091</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>898</th>\n",
       "      <td>949</td>\n",
       "      <td>大数据时代信息隐私的保护问题研究</td>\n",
       "      <td>李延舜</td>\n",
       "      <td>河南社会科学</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>42.0</td>\n",
       "      <td>1227</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>899</th>\n",
       "      <td>950</td>\n",
       "      <td>大数据网络协作传输优化编码方法</td>\n",
       "      <td>孙媛</td>\n",
       "      <td>科技通报</td>\n",
       "      <td>2017-03-31</td>\n",
       "      <td>5.0</td>\n",
       "      <td>50</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>900 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                      篇名                  作者               刊名  \\\n",
       "0            51     基于大数据糖尿病患者膳食管理系统的设计         章琦; 章玮; 白正玉           中国全科医学   \n",
       "1            52  人工智能算法在铁道车辆动力学仿真中的应用进展     唐兆;董少迪;罗仁;蒋涛;邓锐         交通运输工程学报   \n",
       "2            53       人工智能时代算法风险的法律规制论纲                 胡小伟  湖北大学学报(哲学社会科学版)   \n",
       "3            54            营销领域人工智能研究综述       林子筠; 吴琼琳; 才凤艳          外国经济与管理   \n",
       "4            55    多特征级联图像数据库目标人工智能匹配仿真            徐颖慧; 晋国卿            计算机仿真   \n",
       "..          ...                     ...                 ...              ...   \n",
       "895         946  基于大数据分析的智能电网降损效果估计模型仿真                 吕守旭             中国电力   \n",
       "896         947    基于大数据分析的电网精准规划信息系统设计         杨玉新; 马伟; 赵阳           现代电子技术   \n",
       "897         948         基于大数据的多媒体画面语言研究  王志军; 吴向文; 冯小燕; 温小勇           电化教育研究   \n",
       "898         949        大数据时代信息隐私的保护问题研究                 李延舜           河南社会科学   \n",
       "899         950         大数据网络协作传输优化编码方法                  孙媛             科技通报   \n",
       "\n",
       "                 发表时间    被引    下载  操作  \n",
       "0          2021-03-18   NaN   239  下载  \n",
       "1    2021-03-16 11:06   NaN   269  下载  \n",
       "2          2021-03-16   1.0   862  下载  \n",
       "3          2021-03-15   NaN  1214  下载  \n",
       "4          2021-03-15   NaN    29  下载  \n",
       "..                ...   ...   ...  ..  \n",
       "895        2017-04-05   6.0   237  下载  \n",
       "896        2017-04-01  18.0   194  下载  \n",
       "897        2017-04-01  15.0  1091  下载  \n",
       "898        2017-04-01  42.0  1227  下载  \n",
       "899        2017-03-31   5.0    50  下载  \n",
       "\n",
       "[900 rows x 8 columns]"
      ]
     },
     "execution_count": 77,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Stack the per-page tables into one frame with a fresh 0..n-1 index\n",
    "df_url_out = pd.concat(link_df, ignore_index=True)\n",
    "df_url_out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 78,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Detail-page links: take the href of the link in the second cell of every\n",
    "# gridTable row, for every captured page, and gather them in one flat list.\n",
    "# Flattening with extend() keeps the links of all pages in root_group,\n",
    "# however many pages were captured.\n",
    "href_group = []\n",
    "\n",
    "for root in root_group:\n",
    "    href = root.xpath('.//*[@id=\"gridTable\"]/table/tbody/tr/td[2]/a/@href')\n",
    "    href_group.extend(href)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 79,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>详细页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 1 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 详细页链接\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "..                                                 ...\n",
       "795  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "796  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "797  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "798  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "799  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "\n",
       "[800 rows x 1 columns]"
      ]
     },
     "execution_count": 79,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Pass every collected href through correct() and tabulate the results\n",
    "href_group_correct = list(map(correct, href_group))\n",
    "df_link = pd.DataFrame({'详细页链接': href_group_correct})\n",
    "df_link"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 80,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n",
      "11\n",
      "12\n",
      "13\n",
      "14\n",
      "15\n",
      "16\n",
      "17\n",
      "18\n",
      "19\n",
      "20\n",
      "21\n",
      "22\n",
      "23\n",
      "24\n",
      "25\n",
      "26\n",
      "27\n",
      "28\n",
      "29\n",
      "30\n",
      "31\n",
      "32\n",
      "33\n",
      "34\n",
      "35\n",
      "36\n",
      "37\n",
      "38\n",
      "39\n",
      "40\n",
      "41\n",
      "42\n",
      "43\n",
      "44\n",
      "45\n",
      "46\n",
      "47\n",
      "48\n",
      "49\n",
      "50\n",
      "51\n",
      "52\n",
      "53\n",
      "54\n",
      "55\n",
      "56\n",
      "57\n",
      "58\n",
      "59\n",
      "60\n",
      "61\n",
      "62\n",
      "63\n",
      "64\n",
      "65\n",
      "66\n",
      "67\n",
      "68\n",
      "69\n",
      "70\n",
      "71\n",
      "72\n",
      "73\n",
      "74\n",
      "75\n",
      "76\n",
      "77\n",
      "78\n",
      "79\n",
      "80\n",
      "81\n",
      "82\n",
      "83\n",
      "84\n",
      "85\n",
      "86\n",
      "87\n",
      "88\n",
      "89\n",
      "90\n",
      "91\n",
      "92\n",
      "93\n",
      "94\n",
      "95\n",
      "96\n",
      "97\n",
      "98\n",
      "99\n",
      "100\n",
      "101\n",
      "102\n",
      "103\n",
      "104\n",
      "105\n",
      "106\n",
      "107\n",
      "108\n",
      "109\n",
      "110\n",
      "111\n",
      "112\n",
      "113\n",
      "114\n",
      "115\n",
      "116\n",
      "117\n",
      "118\n",
      "119\n",
      "120\n",
      "121\n",
      "122\n",
      "123\n",
      "124\n",
      "125\n",
      "126\n",
      "127\n",
      "128\n",
      "129\n",
      "130\n",
      "131\n",
      "132\n",
      "133\n",
      "134\n",
      "135\n",
      "136\n",
      "137\n",
      "138\n",
      "139\n",
      "140\n",
      "141\n",
      "142\n",
      "143\n",
      "144\n",
      "145\n",
      "146\n",
      "147\n",
      "148\n",
      "149\n",
      "150\n",
      "151\n",
      "152\n",
      "153\n",
      "154\n",
      "155\n",
      "156\n",
      "157\n",
      "158\n",
      "159\n",
      "160\n",
      "161\n",
      "162\n",
      "163\n",
      "164\n",
      "165\n",
      "166\n",
      "167\n",
      "168\n",
      "169\n",
      "170\n",
      "171\n",
      "172\n",
      "173\n",
      "174\n",
      "175\n",
      "176\n",
      "177\n",
      "178\n",
      "179\n",
      "180\n",
      "181\n",
      "182\n",
      "183\n",
      "184\n",
      "185\n",
      "186\n",
      "187\n",
      "188\n",
      "189\n",
      "190\n",
      "191\n",
      "192\n",
      "193\n",
      "194\n",
      "195\n",
      "196\n",
      "197\n",
      "198\n",
      "199\n",
      "200\n",
      "201\n",
      "202\n",
      "203\n",
      "204\n",
      "205\n",
      "206\n",
      "207\n",
      "208\n",
      "209\n",
      "210\n",
      "211\n",
      "212\n",
      "213\n",
      "214\n",
      "215\n",
      "216\n",
      "217\n",
      "218\n",
      "219\n",
      "220\n",
      "221\n",
      "222\n",
      "223\n",
      "224\n",
      "225\n",
      "226\n",
      "227\n",
      "228\n",
      "229\n",
      "230\n",
      "231\n",
      "232\n",
      "233\n",
      "234\n",
      "235\n",
      "236\n",
      "237\n",
      "238\n",
      "239\n",
      "240\n",
      "241\n",
      "242\n",
      "243\n",
      "244\n",
      "245\n",
      "246\n",
      "247\n",
      "248\n",
      "249\n",
      "250\n",
      "251\n",
      "252\n",
      "253\n",
      "254\n",
      "255\n",
      "256\n",
      "257\n",
      "258\n",
      "259\n",
      "260\n",
      "261\n",
      "262\n",
      "263\n",
      "264\n",
      "265\n",
      "266\n",
      "267\n",
      "268\n",
      "269\n",
      "270\n",
      "271\n",
      "272\n",
      "273\n",
      "274\n",
      "275\n",
      "276\n",
      "277\n",
      "278\n",
      "279\n",
      "280\n",
      "281\n",
      "282\n",
      "283\n",
      "284\n",
      "285\n",
      "286\n",
      "287\n",
      "288\n",
      "289\n",
      "290\n",
      "291\n",
      "292\n",
      "293\n",
      "294\n",
      "295\n",
      "296\n",
      "297\n",
      "298\n",
      "299\n",
      "300\n",
      "301\n",
      "302\n",
      "303\n",
      "304\n",
      "305\n",
      "306\n",
      "307\n",
      "308\n",
      "309\n",
      "310\n",
      "311\n",
      "312\n",
      "313\n",
      "314\n",
      "315\n",
      "316\n",
      "317\n",
      "318\n",
      "319\n",
      "320\n",
      "321\n",
      "322\n",
      "323\n",
      "324\n",
      "325\n",
      "326\n",
      "327\n",
      "328\n",
      "329\n",
      "330\n",
      "331\n",
      "332\n",
      "333\n",
      "334\n",
      "335\n",
      "336\n",
      "337\n",
      "338\n",
      "339\n",
      "340\n",
      "341\n",
      "342\n",
      "343\n",
      "344\n",
      "345\n",
      "346\n",
      "347\n",
      "348\n",
      "349\n",
      "350\n",
      "351\n",
      "352\n",
      "353\n",
      "354\n",
      "355\n",
      "356\n",
      "357\n",
      "358\n",
      "359\n",
      "360\n",
      "361\n",
      "362\n",
      "363\n",
      "364\n",
      "365\n",
      "366\n",
      "367\n",
      "368\n",
      "369\n",
      "370\n",
      "371\n",
      "372\n",
      "373\n",
      "374\n",
      "375\n",
      "376\n",
      "377\n",
      "378\n",
      "379\n",
      "380\n",
      "381\n",
      "382\n",
      "383\n",
      "384\n",
      "385\n",
      "386\n",
      "387\n",
      "388\n",
      "389\n",
      "390\n",
      "391\n",
      "392\n",
      "393\n",
      "394\n",
      "395\n",
      "396\n",
      "397\n",
      "398\n",
      "399\n",
      "400\n",
      "401\n",
      "402\n",
      "403\n",
      "404\n",
      "405\n",
      "406\n",
      "407\n",
      "408\n",
      "409\n",
      "410\n",
      "411\n",
      "412\n",
      "413\n",
      "414\n",
      "415\n",
      "416\n",
      "417\n",
      "418\n",
      "419\n",
      "420\n",
      "421\n",
      "422\n",
      "423\n",
      "424\n",
      "425\n",
      "426\n",
      "427\n",
      "428\n",
      "429\n",
      "430\n",
      "431\n",
      "432\n",
      "433\n",
      "434\n",
      "435\n",
      "436\n",
      "437\n",
      "438\n",
      "439\n",
      "440\n",
      "441\n",
      "442\n",
      "443\n",
      "444\n",
      "445\n",
      "446\n",
      "447\n",
      "448\n",
      "449\n",
      "450\n",
      "451\n",
      "452\n",
      "453\n",
      "454\n",
      "455\n",
      "456\n",
      "457\n",
      "458\n",
      "459\n",
      "460\n",
      "461\n",
      "462\n",
      "463\n",
      "464\n",
      "465\n",
      "466\n",
      "467\n",
      "468\n",
      "469\n",
      "470\n",
      "471\n",
      "472\n",
      "473\n",
      "474\n",
      "475\n",
      "476\n",
      "477\n",
      "478\n",
      "479\n",
      "480\n",
      "481\n",
      "482\n",
      "483\n",
      "484\n",
      "485\n",
      "486\n",
      "487\n",
      "488\n",
      "489\n",
      "490\n",
      "491\n",
      "492\n",
      "493\n",
      "494\n",
      "495\n",
      "496\n",
      "497\n",
      "498\n",
      "499\n",
      "500\n",
      "501\n",
      "502\n",
      "503\n",
      "504\n",
      "505\n",
      "506\n",
      "507\n",
      "508\n",
      "509\n",
      "510\n",
      "511\n",
      "512\n",
      "513\n",
      "514\n",
      "515\n",
      "516\n",
      "517\n",
      "518\n",
      "519\n",
      "520\n",
      "521\n",
      "522\n",
      "523\n",
      "524\n",
      "525\n",
      "526\n",
      "527\n",
      "528\n",
      "529\n",
      "530\n",
      "531\n",
      "532\n",
      "533\n",
      "534\n",
      "535\n",
      "536\n",
      "537\n",
      "538\n",
      "539\n",
      "540\n",
      "541\n",
      "542\n",
      "543\n",
      "544\n",
      "545\n",
      "546\n",
      "547\n",
      "548\n",
      "549\n",
      "550\n",
      "551\n",
      "552\n",
      "553\n",
      "554\n",
      "555\n",
      "556\n",
      "557\n",
      "558\n",
      "559\n",
      "560\n",
      "561\n",
      "562\n",
      "563\n",
      "564\n",
      "565\n",
      "566\n",
      "567\n",
      "568\n",
      "569\n",
      "570\n",
      "571\n",
      "572\n",
      "573\n",
      "574\n",
      "575\n",
      "576\n",
      "577\n",
      "578\n",
      "579\n",
      "580\n",
      "581\n",
      "582\n",
      "583\n",
      "584\n",
      "585\n",
      "586\n",
      "587\n",
      "588\n",
      "589\n",
      "590\n",
      "591\n",
      "592\n",
      "593\n",
      "594\n",
      "595\n",
      "596\n",
      "597\n",
      "598\n",
      "599\n",
      "600\n",
      "601\n",
      "602\n",
      "603\n",
      "604\n",
      "605\n",
      "606\n",
      "607\n",
      "608\n",
      "609\n",
      "610\n",
      "611\n",
      "612\n",
      "613\n",
      "614\n",
      "615\n",
      "616\n",
      "617\n",
      "618\n",
      "619\n",
      "620\n",
      "621\n",
      "622\n",
      "623\n",
      "624\n",
      "625\n",
      "626\n",
      "627\n",
      "628\n",
      "629\n",
      "630\n",
      "631\n",
      "632\n",
      "633\n",
      "634\n",
      "635\n",
      "636\n",
      "637\n",
      "638\n",
      "639\n",
      "640\n",
      "641\n",
      "642\n",
      "643\n",
      "644\n",
      "645\n",
      "646\n",
      "647\n",
      "648\n",
      "649\n",
      "650\n",
      "651\n",
      "652\n",
      "653\n",
      "654\n",
      "655\n",
      "656\n",
      "657\n",
      "658\n",
      "659\n",
      "660\n",
      "661\n",
      "662\n",
      "663\n",
      "664\n",
      "665\n",
      "666\n",
      "667\n",
      "668\n",
      "669\n",
      "670\n",
      "671\n",
      "672\n",
      "673\n",
      "674\n",
      "675\n",
      "676\n",
      "677\n",
      "678\n",
      "679\n",
      "680\n",
      "681\n",
      "682\n",
      "683\n",
      "684\n",
      "685\n",
      "686\n",
      "687\n",
      "688\n",
      "689\n",
      "690\n",
      "691\n",
      "692\n",
      "693\n",
      "694\n",
      "695\n",
      "696\n",
      "697\n",
      "698\n",
      "699\n",
      "700\n",
      "701\n",
      "702\n",
      "703\n",
      "704\n",
      "705\n",
      "706\n",
      "707\n",
      "708\n"
     ]
    }
   ],
   "source": [
    "# PDF下载链接\n",
    "pdf_links=[]\n",
    "link_num = 0\n",
    "\n",
    "for url in href_group_correct:\n",
    "    try:\n",
    "        r = session.get(url)\n",
    "        pdf_link_xpath=r.html.xpath('//*[@id=\"pdfDown\"]/@href')[1]\n",
    "        pdf_links.append(pdf_link_xpath)\n",
    "        link_num += 1\n",
    "        print(link_num)\n",
    "    except:\n",
    "        continue\n",
    "    time.sleep(10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 82,
   "metadata": {},
   "outputs": [],
   "source": [
    "pdf_links_correct=['https://kns.cnki.net'+link for link in pdf_links]\n",
    "df_pdf_download=pd.DataFrame({'PDF下载链接':pdf_links_correct})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 83,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>703</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>704</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>705</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>706</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>707</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>708 rows × 1 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                               PDF下载链接\n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "..                                                 ...\n",
       "703  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "704  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "705  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "706  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "707  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "\n",
       "[708 rows x 1 columns]"
      ]
     },
     "execution_count": 83,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_pdf_download"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 84,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "795  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "796  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "797  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "798  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "799  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "795                                                NaN  \n",
       "796                                                NaN  \n",
       "797                                                NaN  \n",
       "798                                                NaN  \n",
       "799                                                NaN  \n",
       "\n",
       "[800 rows x 2 columns]"
      ]
     },
     "execution_count": 84,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_链接列表合并=pd.concat([df_link,df_pdf_download],axis=1)\n",
    "df_链接列表合并"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 85,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>51</td>\n",
       "      <td>基于大数据糖尿病患者膳食管理系统的设计</td>\n",
       "      <td>章琦; 章玮; 白正玉</td>\n",
       "      <td>中国全科医学</td>\n",
       "      <td>2021-03-18</td>\n",
       "      <td>NaN</td>\n",
       "      <td>239</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>人工智能算法在铁道车辆动力学仿真中的应用进展</td>\n",
       "      <td>唐兆;董少迪;罗仁;蒋涛;邓锐</td>\n",
       "      <td>交通运输工程学报</td>\n",
       "      <td>2021-03-16 11:06</td>\n",
       "      <td>NaN</td>\n",
       "      <td>269</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>人工智能时代算法风险的法律规制论纲</td>\n",
       "      <td>胡小伟</td>\n",
       "      <td>湖北大学学报(哲学社会科学版)</td>\n",
       "      <td>2021-03-16</td>\n",
       "      <td>1.0</td>\n",
       "      <td>862</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>营销领域人工智能研究综述</td>\n",
       "      <td>林子筠; 吴琼琳; 才凤艳</td>\n",
       "      <td>外国经济与管理</td>\n",
       "      <td>2021-03-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1214</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>多特征级联图像数据库目标人工智能匹配仿真</td>\n",
       "      <td>徐颖慧; 晋国卿</td>\n",
       "      <td>计算机仿真</td>\n",
       "      <td>2021-03-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>29</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>895</th>\n",
       "      <td>946</td>\n",
       "      <td>基于大数据分析的智能电网降损效果估计模型仿真</td>\n",
       "      <td>吕守旭</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2017-04-05</td>\n",
       "      <td>6.0</td>\n",
       "      <td>237</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>896</th>\n",
       "      <td>947</td>\n",
       "      <td>基于大数据分析的电网精准规划信息系统设计</td>\n",
       "      <td>杨玉新; 马伟; 赵阳</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>18.0</td>\n",
       "      <td>194</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>897</th>\n",
       "      <td>948</td>\n",
       "      <td>基于大数据的多媒体画面语言研究</td>\n",
       "      <td>王志军; 吴向文; 冯小燕; 温小勇</td>\n",
       "      <td>电化教育研究</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>15.0</td>\n",
       "      <td>1091</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>898</th>\n",
       "      <td>949</td>\n",
       "      <td>大数据时代信息隐私的保护问题研究</td>\n",
       "      <td>李延舜</td>\n",
       "      <td>河南社会科学</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>42.0</td>\n",
       "      <td>1227</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>899</th>\n",
       "      <td>950</td>\n",
       "      <td>大数据网络协作传输优化编码方法</td>\n",
       "      <td>孙媛</td>\n",
       "      <td>科技通报</td>\n",
       "      <td>2017-03-31</td>\n",
       "      <td>5.0</td>\n",
       "      <td>50</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>900 rows × 10 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                      篇名                  作者               刊名  \\\n",
       "0            51     基于大数据糖尿病患者膳食管理系统的设计         章琦; 章玮; 白正玉           中国全科医学   \n",
       "1            52  人工智能算法在铁道车辆动力学仿真中的应用进展     唐兆;董少迪;罗仁;蒋涛;邓锐         交通运输工程学报   \n",
       "2            53       人工智能时代算法风险的法律规制论纲                 胡小伟  湖北大学学报(哲学社会科学版)   \n",
       "3            54            营销领域人工智能研究综述       林子筠; 吴琼琳; 才凤艳          外国经济与管理   \n",
       "4            55    多特征级联图像数据库目标人工智能匹配仿真            徐颖慧; 晋国卿            计算机仿真   \n",
       "..          ...                     ...                 ...              ...   \n",
       "895         946  基于大数据分析的智能电网降损效果估计模型仿真                 吕守旭             中国电力   \n",
       "896         947    基于大数据分析的电网精准规划信息系统设计         杨玉新; 马伟; 赵阳           现代电子技术   \n",
       "897         948         基于大数据的多媒体画面语言研究  王志军; 吴向文; 冯小燕; 温小勇           电化教育研究   \n",
       "898         949        大数据时代信息隐私的保护问题研究                 李延舜           河南社会科学   \n",
       "899         950         大数据网络协作传输优化编码方法                  孙媛             科技通报   \n",
       "\n",
       "                 发表时间    被引    下载  操作  \\\n",
       "0          2021-03-18   NaN   239  下载   \n",
       "1    2021-03-16 11:06   NaN   269  下载   \n",
       "2          2021-03-16   1.0   862  下载   \n",
       "3          2021-03-15   NaN  1214  下载   \n",
       "4          2021-03-15   NaN    29  下载   \n",
       "..                ...   ...   ...  ..   \n",
       "895        2017-04-05   6.0   237  下载   \n",
       "896        2017-04-01  18.0   194  下载   \n",
       "897        2017-04-01  15.0  1091  下载   \n",
       "898        2017-04-01  42.0  1227  下载   \n",
       "899        2017-03-31   5.0    50  下载   \n",
       "\n",
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "895                                                NaN   \n",
       "896                                                NaN   \n",
       "897                                                NaN   \n",
       "898                                                NaN   \n",
       "899                                                NaN   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "895                                                NaN  \n",
       "896                                                NaN  \n",
       "897                                                NaN  \n",
       "898                                                NaN  \n",
       "899                                                NaN  \n",
       "\n",
       "[900 rows x 10 columns]"
      ]
     },
     "execution_count": 85,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_合并=pd.concat([df_url_out,df_链接列表合并],axis=1)\n",
    "df_合并"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 86,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>森林生态站大数据快速存储与索引方法  网络首发</td>\n",
       "      <td>王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福</td>\n",
       "      <td>农业机械学报</td>\n",
       "      <td>2021-07-06 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》</td>\n",
       "      <td>张诗雨</td>\n",
       "      <td>锻压技术</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>基于大数据分析的舰船装备寿命测试系统</td>\n",
       "      <td>化雪荟</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-06-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>基于大数据与信息技术的拖拉机零部件供应链</td>\n",
       "      <td>王弥</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>104.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>5</td>\n",
       "      <td>智能制造和大数据挖掘在农业机械设计中的应用</td>\n",
       "      <td>杜伯阳</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>945</th>\n",
       "      <td>895</td>\n",
       "      <td>946</td>\n",
       "      <td>基于大数据分析的智能电网降损效果估计模型仿真</td>\n",
       "      <td>吕守旭</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2017-04-05</td>\n",
       "      <td>6.0</td>\n",
       "      <td>237.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>946</th>\n",
       "      <td>896</td>\n",
       "      <td>947</td>\n",
       "      <td>基于大数据分析的电网精准规划信息系统设计</td>\n",
       "      <td>杨玉新; 马伟; 赵阳</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>18.0</td>\n",
       "      <td>194.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>947</th>\n",
       "      <td>897</td>\n",
       "      <td>948</td>\n",
       "      <td>基于大数据的多媒体画面语言研究</td>\n",
       "      <td>王志军; 吴向文; 冯小燕; 温小勇</td>\n",
       "      <td>电化教育研究</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>15.0</td>\n",
       "      <td>1091.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>948</th>\n",
       "      <td>898</td>\n",
       "      <td>949</td>\n",
       "      <td>大数据时代信息隐私的保护问题研究</td>\n",
       "      <td>李延舜</td>\n",
       "      <td>河南社会科学</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>42.0</td>\n",
       "      <td>1227.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>949</th>\n",
       "      <td>899</td>\n",
       "      <td>950</td>\n",
       "      <td>大数据网络协作传输优化编码方法</td>\n",
       "      <td>孙媛</td>\n",
       "      <td>科技通报</td>\n",
       "      <td>2017-03-31</td>\n",
       "      <td>5.0</td>\n",
       "      <td>50.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>950 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index  Unnamed: 0                                                 篇名  \\\n",
       "0        0           1                            森林生态站大数据快速存储与索引方法  网络首发   \n",
       "1        1           2  人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》   \n",
       "2        2           3                                 基于大数据分析的舰船装备寿命测试系统   \n",
       "3        3           4                               基于大数据与信息技术的拖拉机零部件供应链   \n",
       "4        4           5                              智能制造和大数据挖掘在农业机械设计中的应用   \n",
       "..     ...         ...                                                ...   \n",
       "945    895         946                             基于大数据分析的智能电网降损效果估计模型仿真   \n",
       "946    896         947                               基于大数据分析的电网精准规划信息系统设计   \n",
       "947    897         948                                    基于大数据的多媒体画面语言研究   \n",
       "948    898         949                                   大数据时代信息隐私的保护问题研究   \n",
       "949    899         950                                    大数据网络协作传输优化编码方法   \n",
       "\n",
       "                         作者      刊名              发表时间    被引      下载  操作  \\\n",
       "0    王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福  农业机械学报  2021-07-06 09:48   NaN     NaN  下载   \n",
       "1                       张诗雨    锻压技术        2021-06-25   NaN     8.0  下载   \n",
       "2                       化雪荟  舰船科学技术        2021-06-23   NaN     NaN  下载   \n",
       "3                        王弥   农机化研究        2021-06-15   NaN   104.0  下载   \n",
       "4                       杜伯阳   农机化研究        2021-06-15   NaN   186.0  下载   \n",
       "..                      ...     ...               ...   ...     ...  ..   \n",
       "945                     吕守旭    中国电力        2017-04-05   6.0   237.0  下载   \n",
       "946             杨玉新; 马伟; 赵阳  现代电子技术        2017-04-01  18.0   194.0  下载   \n",
       "947      王志军; 吴向文; 冯小燕; 温小勇  电化教育研究        2017-04-01  15.0  1091.0  下载   \n",
       "948                     李延舜  河南社会科学        2017-04-01  42.0  1227.0  下载   \n",
       "949                      孙媛    科技通报        2017-03-31   5.0    50.0  下载   \n",
       "\n",
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "945                                                NaN   \n",
       "946                                                NaN   \n",
       "947                                                NaN   \n",
       "948                                                NaN   \n",
       "949                                                NaN   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "945                                                NaN  \n",
       "946                                                NaN  \n",
       "947                                                NaN  \n",
       "948                                                NaN  \n",
       "949                                                NaN  \n",
       "\n",
       "[950 rows x 11 columns]"
      ]
     },
     "execution_count": 86,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Combine the page table and the merged table into one overall table.\n",
    "# pd.concat replaces DataFrame.append (deprecated in pandas 1.4, removed in 2.0) and stacks the rows the same way.\n",
    "# reset_index() without drop=True keeps the old row labels in an 'index' column, exactly as the original did.\n",
    "df_总表 = pd.concat([df_页面表格, df_合并]).reset_index()\n",
    "df_总表"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 87,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>森林生态站大数据快速存储与索引方法  网络首发</td>\n",
       "      <td>王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福</td>\n",
       "      <td>农业机械学报</td>\n",
       "      <td>2021-07-06 09:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》</td>\n",
       "      <td>张诗雨</td>\n",
       "      <td>锻压技术</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>8.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>基于大数据分析的舰船装备寿命测试系统</td>\n",
       "      <td>化雪荟</td>\n",
       "      <td>舰船科学技术</td>\n",
       "      <td>2021-06-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>基于大数据与信息技术的拖拉机零部件供应链</td>\n",
       "      <td>王弥</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>104.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>5</td>\n",
       "      <td>智能制造和大数据挖掘在农业机械设计中的应用</td>\n",
       "      <td>杜伯阳</td>\n",
       "      <td>农机化研究</td>\n",
       "      <td>2021-06-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>945</th>\n",
       "      <td>895</td>\n",
       "      <td>946</td>\n",
       "      <td>基于大数据分析的智能电网降损效果估计模型仿真</td>\n",
       "      <td>吕守旭</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2017-04-05</td>\n",
       "      <td>6.0</td>\n",
       "      <td>237.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>946</th>\n",
       "      <td>896</td>\n",
       "      <td>947</td>\n",
       "      <td>基于大数据分析的电网精准规划信息系统设计</td>\n",
       "      <td>杨玉新; 马伟; 赵阳</td>\n",
       "      <td>现代电子技术</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>18.0</td>\n",
       "      <td>194.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>947</th>\n",
       "      <td>897</td>\n",
       "      <td>948</td>\n",
       "      <td>基于大数据的多媒体画面语言研究</td>\n",
       "      <td>王志军; 吴向文; 冯小燕; 温小勇</td>\n",
       "      <td>电化教育研究</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>15.0</td>\n",
       "      <td>1091.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>948</th>\n",
       "      <td>898</td>\n",
       "      <td>949</td>\n",
       "      <td>大数据时代信息隐私的保护问题研究</td>\n",
       "      <td>李延舜</td>\n",
       "      <td>河南社会科学</td>\n",
       "      <td>2017-04-01</td>\n",
       "      <td>42.0</td>\n",
       "      <td>1227.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>949</th>\n",
       "      <td>899</td>\n",
       "      <td>950</td>\n",
       "      <td>大数据网络协作传输优化编码方法</td>\n",
       "      <td>孙媛</td>\n",
       "      <td>科技通报</td>\n",
       "      <td>2017-03-31</td>\n",
       "      <td>5.0</td>\n",
       "      <td>50.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>950 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index  Unnamed: 0                                                 篇名  \\\n",
       "0        0           1                            森林生态站大数据快速存储与索引方法  网络首发   \n",
       "1        1           2  人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》   \n",
       "2        2           3                                 基于大数据分析的舰船装备寿命测试系统   \n",
       "3        3           4                               基于大数据与信息技术的拖拉机零部件供应链   \n",
       "4        4           5                              智能制造和大数据挖掘在农业机械设计中的应用   \n",
       "..     ...         ...                                                ...   \n",
       "945    895         946                             基于大数据分析的智能电网降损效果估计模型仿真   \n",
       "946    896         947                               基于大数据分析的电网精准规划信息系统设计   \n",
       "947    897         948                                    基于大数据的多媒体画面语言研究   \n",
       "948    898         949                                   大数据时代信息隐私的保护问题研究   \n",
       "949    899         950                                    大数据网络协作传输优化编码方法   \n",
       "\n",
       "                         作者      刊名              发表时间    被引      下载  操作  \\\n",
       "0    王新阳; 贾相宇; 陈志泊; 崔晓晖; 许福  农业机械学报  2021-07-06 09:48   NaN     NaN  下载   \n",
       "1                       张诗雨    锻压技术        2021-06-25   NaN     8.0  下载   \n",
       "2                       化雪荟  舰船科学技术        2021-06-23   NaN     NaN  下载   \n",
       "3                        王弥   农机化研究        2021-06-15   NaN   104.0  下载   \n",
       "4                       杜伯阳   农机化研究        2021-06-15   NaN   186.0  下载   \n",
       "..                      ...     ...               ...   ...     ...  ..   \n",
       "945                     吕守旭    中国电力        2017-04-05   6.0   237.0  下载   \n",
       "946             杨玉新; 马伟; 赵阳  现代电子技术        2017-04-01  18.0   194.0  下载   \n",
       "947      王志军; 吴向文; 冯小燕; 温小勇  电化教育研究        2017-04-01  15.0  1091.0  下载   \n",
       "948                     李延舜  河南社会科学        2017-04-01  42.0  1227.0  下载   \n",
       "949                      孙媛    科技通报        2017-03-31   5.0    50.0  下载   \n",
       "\n",
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "945                                                NaN   \n",
       "946                                                NaN   \n",
       "947                                                NaN   \n",
       "948                                                NaN   \n",
       "949                                                NaN   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "945                                                NaN  \n",
       "946                                                NaN  \n",
       "947                                                NaN  \n",
       "948                                                NaN  \n",
       "949                                                NaN  \n",
       "\n",
       "[950 rows x 11 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# Save the overall table to a local Excel workbook (sheet '知网', openpyxl engine), then render it.\n",
    "df_总表.to_excel('知网文章数据.xlsx', sheet_name=\"知网\", engine=\"openpyxl\")\n",
    "display(df_总表)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 下载refworks文件及原文"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 98,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[1, 2, 3, 4, 5, 6, 7, 8, 9, 10]\n"
     ]
    }
   ],
   "source": [
    "# Export the RefWorks file (.txt) and download the articles.\n",
    "# One select-all batch may not exceed 500 articles, so the work is split into 2 passes.\n",
    "# Page numbers handled in this pass: 1 through 10.\n",
    "pages = [*range(1, 11)]\n",
    "print(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 99,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "ename": "NoSuchElementException",
     "evalue": "Message: no such element: Unable to locate element: {\"method\":\"css selector\",\"selector\":\"[id=\"total\"]\"}\n  (Session info: chrome=91.0.4472.77)\n",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mNoSuchElementException\u001b[0m                    Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-99-d4e1693c3138>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[1;31m# 返回第一页\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_id\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'total'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mclick\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element_by_id\u001b[1;34m(self, id_)\u001b[0m\n\u001b[0;32m    358\u001b[0m             \u001b[0melement\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_id\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'foo'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    359\u001b[0m         \"\"\"\n\u001b[1;32m--> 360\u001b[1;33m         \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mby\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mID\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mid_\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    361\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    362\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0mfind_elements_by_id\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mid_\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element\u001b[1;34m(self, by, value)\u001b[0m\n\u001b[0;32m    974\u001b[0m                 \u001b[0mby\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mCSS_SELECTOR\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    975\u001b[0m                 \u001b[0mvalue\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;34m'[name=\"%s\"]'\u001b[0m \u001b[1;33m%\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 976\u001b[1;33m         return self.execute(Command.FIND_ELEMENT, {\n\u001b[0m\u001b[0;32m    977\u001b[0m             \u001b[1;34m'using'\u001b[0m\u001b[1;33m:\u001b[0m \u001b[0mby\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    978\u001b[0m             'value': value})['value']\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mexecute\u001b[1;34m(self, driver_command, params)\u001b[0m\n\u001b[0;32m    319\u001b[0m         \u001b[0mresponse\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcommand_executor\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mexecute\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdriver_command\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mparams\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    320\u001b[0m         \u001b[1;32mif\u001b[0m \u001b[0mresponse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 321\u001b[1;33m             \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0merror_handler\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcheck_response\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mresponse\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    322\u001b[0m             response['value'] = self._unwrap_value(\n\u001b[0;32m    323\u001b[0m                 response.get('value', None))\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\errorhandler.py\u001b[0m in \u001b[0;36mcheck_response\u001b[1;34m(self, response)\u001b[0m\n\u001b[0;32m    240\u001b[0m                 \u001b[0malert_text\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'alert'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'text'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    241\u001b[0m             \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0malert_text\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 242\u001b[1;33m         \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    243\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    244\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0m_value_or_default\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mdefault\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mNoSuchElementException\u001b[0m: Message: no such element: Unable to locate element: {\"method\":\"css selector\",\"selector\":\"[id=\"total\"]\"}\n  (Session info: chrome=91.0.4472.77)\n"
     ]
    }
   ],
   "source": [
    "# Go back to the first results page by clicking the element with id 'total'.\n",
    "# NOTE(review): the saved output of this cell is a NoSuchElementException for id 'total', i.e. the element\n",
    "# was not found in the window the driver was attached to. Confirm the selector and the active window.\n",
    "driver.find_element_by_id('total').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 100,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Clear the current selection by clicking the link at this XPath under #gridTable.\n",
    "clear_link = driver.find_element_by_xpath('//*[@id=\"gridTable\"]/div[1]/div[2]/div[1]/a')\n",
    "clear_link.click()\n",
    "# Other XPath left in the original cell for reference: //*[@id=\"divGroup\"]/div/a[2]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 101,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Select the 50 articles on a results page, then turn the page.\n",
    "def process_choose(pages, min_wait=15, jitter=20, page_wait=5):\n",
    "    \"\"\"Tick 'select all' once per entry of `pages`, moving to the next results page after each.\n",
    "\n",
    "    Works on the notebook-level `driver`, starting from whatever results page it currently shows.\n",
    "\n",
    "    Args:\n",
    "        pages: iterable of page labels. Each label is only printed as progress; navigation\n",
    "            itself is done by clicking the 'PageNext' element.\n",
    "        min_wait: minimum pause in seconds after ticking 'select all'.\n",
    "        jitter: upper bound in seconds of the random extra pause added to `min_wait`.\n",
    "        page_wait: pause in seconds after turning the page.\n",
    "\n",
    "    Returns:\n",
    "        None.\n",
    "    \"\"\"\n",
    "    for p in pages:\n",
    "        print(p, end='\\t')\n",
    "        driver.find_element_by_id('selectCheckAll1').click()\n",
    "        # Randomised pause before turning the page.\n",
    "        time.sleep(min_wait + jitter * random())\n",
    "        # find_elements_by_id returns an empty list instead of raising when nothing matches.\n",
    "        next_links = driver.find_elements_by_id('PageNext')\n",
    "        if not next_links:\n",
    "            # No 'PageNext' element (presumably the last results page -- TODO confirm): stop here\n",
    "            # instead of aborting with NoSuchElementException after the page was already selected.\n",
    "            print('no next page after', p, '- stopping')\n",
    "            break\n",
    "        next_links[0].click()\n",
    "        time.sleep(page_wait)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 102,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\t2\t3\t4\t5\t6\t7\t8\t9\t10\t"
     ]
    }
   ],
   "source": [
    "# Run the select-and-turn-page routine once for every entry of `pages`.\n",
    "process_choose(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 103,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 'Export & analysis' (导出与分析): click the <i class=\"icon-d\"> element.\n",
    "export_menu_icon = driver.find_element_by_xpath('//i[@class=\"icon-d\"]')\n",
    "export_menu_icon.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 104,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 'Export documents' (导出文献): click the <i class=\"icon-r\"> element.\n",
    "export_docs_icon = driver.find_element_by_xpath('//i[@class=\"icon-r\"]')\n",
    "export_docs_icon.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 107,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Pick the Refworks export type: click the <a> whose exporttype attribute is 'Refworks'.\n",
    "refworks_link = driver.find_element_by_xpath('//a[@exporttype=\"Refworks\"]')\n",
    "refworks_link.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 108,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-BE6D1D3D3A25740F8FBF0E2B1B7F55DE',\n",
       " 'CDwindow-5B989C7D1660390CF02ED17FD9C16541',\n",
       " 'CDwindow-42071B40A3F69F0B59B167CCDDAD64F1',\n",
       " 'CDwindow-2ADE7B546152CA75EA6C346A455A6343',\n",
       " 'CDwindow-126A05A7F81B9C3F5C97516FC6CA623E']"
      ]
     },
     "execution_count": 108,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the handles of all windows currently open in this driver session.\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 109,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-109-520070efe65b>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[2])\n"
     ]
    }
   ],
   "source": [
    "# Switch the driver to another window.\n",
    "# driver.switch_to.window replaces driver.switch_to_window, which emits a DeprecationWarning.\n",
    "# NOTE(review): index 2 is hard-coded; confirm it against the current driver.window_handles before running.\n",
    "driver.switch_to.window(driver.window_handles[2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 110,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Export the .txt file: click the <i class=\"icon icon-export\"> element.\n",
    "export_icon = driver.find_element_by_xpath('//i[@class=\"icon icon-export\"]')\n",
    "export_icon.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 122,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-122-0188c2a7ff70>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[1])\n"
     ]
    }
   ],
   "source": [
    "# Switch the driver to another window.\n",
    "# driver.switch_to.window replaces driver.switch_to_window, which emits a DeprecationWarning.\n",
    "# NOTE(review): index 1 is hard-coded; confirm it against the current driver.window_handles before running.\n",
    "driver.switch_to.window(driver.window_handles[1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 123,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "ename": "NoSuchElementException",
     "evalue": "Message: no such element: Unable to locate element: {\"method\":\"xpath\",\"selector\":\"//*[@id=\"gridTable\"]/div[1]/div[2]/div[1]/a\"}\n  (Session info: chrome=91.0.4472.77)\n",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mNoSuchElementException\u001b[0m                    Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-123-d9f0fad6cfc6>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[1;31m# 清除选择\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'//*[@id=\"gridTable\"]/div[1]/div[2]/div[1]/a'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mclick\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element_by_xpath\u001b[1;34m(self, xpath)\u001b[0m\n\u001b[0;32m    392\u001b[0m             \u001b[0melement\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'//div/td[1]'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    393\u001b[0m         \"\"\"\n\u001b[1;32m--> 394\u001b[1;33m         \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mby\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mXPATH\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mxpath\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    395\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    396\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0mfind_elements_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mxpath\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element\u001b[1;34m(self, by, value)\u001b[0m\n\u001b[0;32m    974\u001b[0m                 \u001b[0mby\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mCSS_SELECTOR\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    975\u001b[0m                 \u001b[0mvalue\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;34m'[name=\"%s\"]'\u001b[0m \u001b[1;33m%\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 976\u001b[1;33m         return self.execute(Command.FIND_ELEMENT, {\n\u001b[0m\u001b[0;32m    977\u001b[0m             \u001b[1;34m'using'\u001b[0m\u001b[1;33m:\u001b[0m \u001b[0mby\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    978\u001b[0m             'value': value})['value']\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mexecute\u001b[1;34m(self, driver_command, params)\u001b[0m\n\u001b[0;32m    319\u001b[0m         \u001b[0mresponse\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcommand_executor\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mexecute\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdriver_command\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mparams\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    320\u001b[0m         \u001b[1;32mif\u001b[0m \u001b[0mresponse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 321\u001b[1;33m             \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0merror_handler\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcheck_response\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mresponse\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    322\u001b[0m             response['value'] = self._unwrap_value(\n\u001b[0;32m    323\u001b[0m                 response.get('value', None))\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\errorhandler.py\u001b[0m in \u001b[0;36mcheck_response\u001b[1;34m(self, response)\u001b[0m\n\u001b[0;32m    240\u001b[0m                 \u001b[0malert_text\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'alert'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'text'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    241\u001b[0m             \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0malert_text\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 242\u001b[1;33m         \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    243\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    244\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0m_value_or_default\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mdefault\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mNoSuchElementException\u001b[0m: Message: no such element: Unable to locate element: {\"method\":\"xpath\",\"selector\":\"//*[@id=\"gridTable\"]/div[1]/div[2]/div[1]/a\"}\n  (Session info: chrome=91.0.4472.77)\n"
     ]
    }
   ],
   "source": [
    "# 清除选择\n",
    "driver.find_element_by_xpath('//*[@id=\"gridTable\"]/div[1]/div[2]/div[1]/a').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 118,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[10, 11, 12, 13, 14, 15, 16, 17, 18]\n"
     ]
    }
   ],
   "source": [
    "# 第二轮下载\n",
    "pages = list(range(10,19))\n",
    "print(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 121,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "10\t"
     ]
    },
    {
     "ename": "NoSuchElementException",
     "evalue": "Message: no such element: Unable to locate element: {\"method\":\"css selector\",\"selector\":\"[id=\"selectCheckAll1\"]\"}\n  (Session info: chrome=91.0.4472.77)\n",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mNoSuchElementException\u001b[0m                    Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-121-5d9228d2e8c5>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[1;32m----> 1\u001b[1;33m \u001b[0mprocess_choose\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mpages\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[1;32m<ipython-input-101-cec042122afd>\u001b[0m in \u001b[0;36mprocess_choose\u001b[1;34m(pages)\u001b[0m\n\u001b[0;32m      3\u001b[0m     \u001b[1;32mfor\u001b[0m \u001b[0mp\u001b[0m \u001b[1;32min\u001b[0m \u001b[0mpages\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      4\u001b[0m         \u001b[0mprint\u001b[0m \u001b[1;33m(\u001b[0m\u001b[0mp\u001b[0m\u001b[1;33m,\u001b[0m\u001b[0mend\u001b[0m\u001b[1;33m=\u001b[0m\u001b[1;34m'\\t'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 5\u001b[1;33m         \u001b[0m全选\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_id\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'selectCheckAll1'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m      6\u001b[0m         \u001b[0m全选\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mclick\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m      7\u001b[0m         \u001b[0mtime\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0msleep\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;36m15\u001b[0m\u001b[1;33m+\u001b[0m\u001b[1;36m20\u001b[0m\u001b[1;33m*\u001b[0m\u001b[0mrandom\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element_by_id\u001b[1;34m(self, id_)\u001b[0m\n\u001b[0;32m    358\u001b[0m             \u001b[0melement\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_id\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'foo'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    359\u001b[0m         \"\"\"\n\u001b[1;32m--> 360\u001b[1;33m         \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mby\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mID\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mid_\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    361\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    362\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0mfind_elements_by_id\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mid_\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element\u001b[1;34m(self, by, value)\u001b[0m\n\u001b[0;32m    974\u001b[0m                 \u001b[0mby\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mCSS_SELECTOR\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    975\u001b[0m                 \u001b[0mvalue\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;34m'[name=\"%s\"]'\u001b[0m \u001b[1;33m%\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 976\u001b[1;33m         return self.execute(Command.FIND_ELEMENT, {\n\u001b[0m\u001b[0;32m    977\u001b[0m             \u001b[1;34m'using'\u001b[0m\u001b[1;33m:\u001b[0m \u001b[0mby\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    978\u001b[0m             'value': value})['value']\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mexecute\u001b[1;34m(self, driver_command, params)\u001b[0m\n\u001b[0;32m    319\u001b[0m         \u001b[0mresponse\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcommand_executor\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mexecute\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdriver_command\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mparams\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    320\u001b[0m         \u001b[1;32mif\u001b[0m \u001b[0mresponse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 321\u001b[1;33m             \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0merror_handler\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcheck_response\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mresponse\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    322\u001b[0m             response['value'] = self._unwrap_value(\n\u001b[0;32m    323\u001b[0m                 response.get('value', None))\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\errorhandler.py\u001b[0m in \u001b[0;36mcheck_response\u001b[1;34m(self, response)\u001b[0m\n\u001b[0;32m    240\u001b[0m                 \u001b[0malert_text\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'alert'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'text'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    241\u001b[0m             \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0malert_text\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 242\u001b[1;33m         \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    243\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    244\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0m_value_or_default\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mdefault\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mNoSuchElementException\u001b[0m: Message: no such element: Unable to locate element: {\"method\":\"css selector\",\"selector\":\"[id=\"selectCheckAll1\"]\"}\n  (Session info: chrome=91.0.4472.77)\n"
     ]
    }
   ],
   "source": [
    "process_choose(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 120,
   "metadata": {
    "collapsed": true
   },
   "outputs": [
    {
     "ename": "NoSuchElementException",
     "evalue": "Message: no such element: Unable to locate element: {\"method\":\"xpath\",\"selector\":\"//i[@class=\"icon-d\"]\"}\n  (Session info: chrome=91.0.4472.77)\n",
     "output_type": "error",
     "traceback": [
      "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
      "\u001b[1;31mNoSuchElementException\u001b[0m                    Traceback (most recent call last)",
      "\u001b[1;32m<ipython-input-120-3215e5db7d25>\u001b[0m in \u001b[0;36m<module>\u001b[1;34m\u001b[0m\n\u001b[0;32m      1\u001b[0m \u001b[1;31m# 导出与分析\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m----> 2\u001b[1;33m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'//i[@class=\"icon-d\"]'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mclick\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element_by_xpath\u001b[1;34m(self, xpath)\u001b[0m\n\u001b[0;32m    392\u001b[0m             \u001b[0melement\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mdriver\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'//div/td[1]'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    393\u001b[0m         \"\"\"\n\u001b[1;32m--> 394\u001b[1;33m         \u001b[1;32mreturn\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mfind_element\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mby\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mXPATH\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m=\u001b[0m\u001b[0mxpath\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    395\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    396\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0mfind_elements_by_xpath\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mxpath\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mfind_element\u001b[1;34m(self, by, value)\u001b[0m\n\u001b[0;32m    974\u001b[0m                 \u001b[0mby\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mBy\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mCSS_SELECTOR\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    975\u001b[0m                 \u001b[0mvalue\u001b[0m \u001b[1;33m=\u001b[0m \u001b[1;34m'[name=\"%s\"]'\u001b[0m \u001b[1;33m%\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 976\u001b[1;33m         return self.execute(Command.FIND_ELEMENT, {\n\u001b[0m\u001b[0;32m    977\u001b[0m             \u001b[1;34m'using'\u001b[0m\u001b[1;33m:\u001b[0m \u001b[0mby\u001b[0m\u001b[1;33m,\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    978\u001b[0m             'value': value})['value']\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\webdriver.py\u001b[0m in \u001b[0;36mexecute\u001b[1;34m(self, driver_command, params)\u001b[0m\n\u001b[0;32m    319\u001b[0m         \u001b[0mresponse\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcommand_executor\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mexecute\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mdriver_command\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mparams\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    320\u001b[0m         \u001b[1;32mif\u001b[0m \u001b[0mresponse\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 321\u001b[1;33m             \u001b[0mself\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0merror_handler\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mcheck_response\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mresponse\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    322\u001b[0m             response['value'] = self._unwrap_value(\n\u001b[0;32m    323\u001b[0m                 response.get('value', None))\n",
      "\u001b[1;32m~\\anaconda3\\lib\\site-packages\\selenium\\webdriver\\remote\\errorhandler.py\u001b[0m in \u001b[0;36mcheck_response\u001b[1;34m(self, response)\u001b[0m\n\u001b[0;32m    240\u001b[0m                 \u001b[0malert_text\u001b[0m \u001b[1;33m=\u001b[0m \u001b[0mvalue\u001b[0m\u001b[1;33m[\u001b[0m\u001b[1;34m'alert'\u001b[0m\u001b[1;33m]\u001b[0m\u001b[1;33m.\u001b[0m\u001b[0mget\u001b[0m\u001b[1;33m(\u001b[0m\u001b[1;34m'text'\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    241\u001b[0m             \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0malert_text\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[1;32m--> 242\u001b[1;33m         \u001b[1;32mraise\u001b[0m \u001b[0mexception_class\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mmessage\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mscreen\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mstacktrace\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0m\u001b[0;32m    243\u001b[0m \u001b[1;33m\u001b[0m\u001b[0m\n\u001b[0;32m    244\u001b[0m     \u001b[1;32mdef\u001b[0m \u001b[0m_value_or_default\u001b[0m\u001b[1;33m(\u001b[0m\u001b[0mself\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mobj\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mkey\u001b[0m\u001b[1;33m,\u001b[0m \u001b[0mdefault\u001b[0m\u001b[1;33m)\u001b[0m\u001b[1;33m:\u001b[0m\u001b[1;33m\u001b[0m\u001b[1;33m\u001b[0m\u001b[0m\n",
      "\u001b[1;31mNoSuchElementException\u001b[0m: Message: no such element: Unable to locate element: {\"method\":\"xpath\",\"selector\":\"//i[@class=\"icon-d\"]\"}\n  (Session info: chrome=91.0.4472.77)\n"
     ]
    }
   ],
   "source": [
    "# 导出与分析 \n",
    "driver.find_element_by_xpath('//i[@class=\"icon-d\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 59,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 导出文献\n",
    "driver.find_element_by_xpath('//i[@class=\"icon-r\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 60,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 点击Refworks\n",
    "driver.find_element_by_xpath('//a[@exporttype=\"Refworks\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-8D8283095CD2D3246CFBF4EE753ABEC4',\n",
       " 'CDwindow-1CD9E637B649BF5766B745C8B5E27E72',\n",
       " 'CDwindow-76303F9E7B0196950BA7E3B3787CD2C3',\n",
       " 'CDwindow-04AC7C2142B82E9212C4D1F1C312DEFF',\n",
       " 'CDwindow-E563C48D1DBA037EBF38E4136C95541F']"
      ]
     },
     "execution_count": 61,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 查看所有的窗口信息\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-62-ecda85629064>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[4])\n"
     ]
    }
   ],
   "source": [
    "# 窗口切换\n",
    "driver.switch_to_window(driver.window_handles[4])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 63,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 导出 .txt文件\n",
    "driver.find_element_by_xpath('//i[@class=\"icon icon-export\"]').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 64,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-64-0188c2a7ff70>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[1])\n"
     ]
    }
   ],
   "source": [
    "# 窗口切换\n",
    "driver.switch_to_window(driver.window_handles[1])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 124,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 批量下载\n",
    "# 调用百度文字识别API\n",
    "import base64\n",
    "import requests \n",
    "from selenium.webdriver.common.by import By\n",
    "\n",
    "def shibie(img):\n",
    "    host = 'https://aip.baidubce.com/oauth/2.0/token?grant_type=client_credentials&client_id=oo62GrYfPSYE9BtoyaSnuOUu&client_secret=xVdPBkUqRSXDZe3mW9MSzIo2d4qwHhB0'\n",
    "    response = requests.get(host)\n",
    "    if response:\n",
    "        respond=response.json()\n",
    "        request_url = \"https://aip.baidubce.com/rest/2.0/ocr/v1/accurate_basic\"\n",
    "    \n",
    "        f = open(img, 'rb')\n",
    "        img = base64.b64encode(f.read())\n",
    "        params = {\"image\":img}\n",
    "        \n",
    "        access_token = '25.3f299829a304d185329781dc942e373b.315360000.1940772255.282335-24492968' # 自行生成并填写\n",
    "        request_url = request_url + \"?access_token=\" + access_token\n",
    "        headers = {'content-type': 'application/x-www-form-urlencoded'}\n",
    "        response = requests.post(request_url, data=params, headers=headers)\n",
    "        if response:\n",
    "            word=response.json()\n",
    "            if word[\"words_result\"]:\n",
    "                return word[\"words_result\"][0]['words'].replace(\" \",\"\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 125,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-125-0dfe2a1ada8f>:1: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[2])\n"
     ]
    }
   ],
   "source": [
    "driver.switch_to_window(driver.window_handles[2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n"
     ]
    }
   ],
   "source": [
    "# 批量下载\n",
    "download_num = 0\n",
    "\n",
    "for url in df_总表[\"PDF下载链接\"]:\n",
    "    try:\n",
    "        time.sleep(2)\n",
    "        driver.get(url)\n",
    "        download_num += 1\n",
    "        print(download_num)\n",
    "        if driver.find_element_by_xpath('//*[@id=\"vImg\"]'):\n",
    "            ele = driver.find_element(By.CSS_SELECTOR, '#vImg') # 验证码截图\n",
    "            ele.screenshot('./image.png')\n",
    "            img='./image.png'\n",
    "            shuru=shibie(img)\n",
    "            driver.find_element_by_xpath('//*[@id=\"vcode\"]').send_keys(shuru)\n",
    "            time.sleep(5)\n",
    "            driver.find_element_by_xpath('/html/body/div/form/dl/dd/button').click()\n",
    "        else:\n",
    "            time.sleep(10)\n",
    "    except:\n",
    "        continue"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.3"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
